diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..87d71738135a2cd7e041676a0fa34ab387014396 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +ToMh_dataset/media/Picture1.png filter=lfs diff=lfs merge=lfs -text diff --git a/ToMh_dataset/.DS_Store b/ToMh_dataset/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..172a526a215fcc1cb447c4ce4612c4389d62e606 Binary files /dev/null and b/ToMh_dataset/.DS_Store differ diff --git a/ToMh_dataset/.gitignore b/ToMh_dataset/.gitignore new file mode 100644 index 0000000000000000000000000000000000000000..a9c9a4c28cec4c113dd94a1ae1da735871f23042 --- /dev/null +++ b/ToMh_dataset/.gitignore @@ -0,0 +1,93 @@ +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +env/ +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +lib/ +lib64/ +parts/ +sdist/ +var/ +*.egg-info/ +.installed.cfg +*.egg + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. 
+*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*,cover +.hypothesis/ + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +target/ + +# IPython Notebook +.ipynb_checkpoints + +# pyenv +.python-version + +# celery beat schedule file +celerybeat-schedule + +# dotenv +.env + +# virtualenv +venv/ +ENV/ + +# Spyder project settings +.spyderproject + +# Rope project settings +.ropeproject + +# Project-specific directories +*_responses/ +Analyze_script/ diff --git a/ToMh_dataset/.gitmodules b/ToMh_dataset/.gitmodules new file mode 100644 index 0000000000000000000000000000000000000000..226a7b55b007ca6f9070e52630c58fc0eb8ec52d --- /dev/null +++ b/ToMh_dataset/.gitmodules @@ -0,0 +1,9 @@ +[submodule "models/EntNet"] + path = models/EntNet + url = https://github.com/kayburns/EntNet.git +[submodule "models/MemN2NandMultObs"] + path = models/MemN2NandMultObs + url = https://github.com/kayburns/MemN2NandMultObs.git +[submodule "models/relation-network"] + path = models/relation-network + url = git@github.com:eringrant/relation-network.git diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..383134fe7c11fa9a972caf3ead72f09b9833fe7b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. 
+3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where is the lettuce really? +Answer: green_drawer +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b4f349179dc85b8c7327950023f2e1ce0d3f864 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Avery really think the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..288ac6977fdadacc0b92f988de27053889f97671 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Charlotte think Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a92d4535d46e2afc30a80b4ed3b0975bc2c173d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Owen think Charlotte thinks Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. 
green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +*** \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4159830c1732706e454930728c7f8f3d265ebaa2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. 
+16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Isabella think Owen thinks Charlotte thinks Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +*** \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..65ada6fd01ce063062463ee5c2983c6970d7e6b7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. 
+10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where is the plum really? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1193db251b7a4b4235f661d292c6b8e0cd94b4e6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. 
+7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does William really think the plum is? +Answer: green_bucket +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bec176f08303d205d2306d07396a0a29126cc961 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. 
+3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Nathan think William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a51082ddd05605610351adc42ad135437c1ed3dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Evelyn think Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a20ffc20fa0d0d341896576484d06b162938dde6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..80e4483d16a6794e35bbe283209038776c62f497 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where is the orange really? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6206b15c117f44c95e4d14958fc5f499a311666f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Ella really think the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..605958f88bbf81c9c249c70a842bb12e6dcfc983 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Elizabeth think Ella thinks the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b2c60a866a6df10e3dc1ffab6dfbcfbf35e6b8d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Chloe think Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. 
red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..034997268bea1e3307e05b72c21592a0166bef1a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. 
+Question: Where does Alexander think Chloe thinks Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ef9a56b0f5511ef48efe9fbf3a589a6ace323d3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. 
+13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where is the melon really? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2138e092ecb7957d2a66031fdd88e73497039c52 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. 
+12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does William really think the melon is? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d4513403e0c27da378469d6efc0c8ff5fd9cc8e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. 
+9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Mila think William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1c4a596b22dd4ee7661f53c9b450779fefecf4c8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. 
+7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ella think Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..062ee3b09321cdd7c7e705860023b4a9b0f5a3c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. 
+5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ava think Ella thinks Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..30dafd88899ea4098ec6a74fd007d6aa9d6055cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. 
+2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a8d8a1e9daa24f466fb9a9311ae671d62633c47e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Abigail really think the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e6a0904549d7a33e404839a1497b082e83a7d57 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed4268f3098f5fdece36b84da5a298f2b6897a38 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +Answer: green_envelope +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..22fd255ddab2a126b8762094b255b9b02888dd30 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Charlotte think Amelia thinks Nathan thinks Abigail thinks the cabbage is? +Answer: green_envelope +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..52f0a9b6a00d433fdd3ef777322a870a60d884ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where is the lime really? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. 
green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..774a7b0c6e8321b6c50f556ecd40ecac6fa9209e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail really think the lime is? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. 
red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c4f9a1c2d7db02d0c4d4214c2f853bd10835ce5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Avery think Abigail thinks the lime is? 
+Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e5e640559e06058dc3340d3c29faebc946a7354 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. 
+15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Jack think Avery thinks Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0309e7f7a4abdb37fcc46ae0cbf3d79ec858c705 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. 
+11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Jack thinks Avery thinks Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fce68abae238ccc9579997f69e5810690c8f562 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. 
+6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..780995d91255e23be840bcb80de41cb2dbb6ee65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. 
+5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Avery really think the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4389a7989343881379a3e0b1ee46e70aa38dca79 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. 
+3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Owen think Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..070bb37e9b2fba34cd76cb5806c13815e065848a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Ella think Owen thinks Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f99dc784b4bb72a120fe6e6a0688ef3096e00747 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Amelia think Ella thinks Owen thinks Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5321e366c88b2faa95e4874af0c7e5d49acbe6db --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where is the carrot really? +Answer: red_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..24cd566ce660c55b243267775d7302799b3a5da1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does William really think the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfde55cd775fce9c051823447ccbdcedadddf3b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Evelyn think William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. 
red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..61fbb31b355967ea33e7de422fed41014e599dc5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Logan think Evelyn thinks William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. 
red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..071f80089aba66a180f40bf8d984495e405cbb75 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. 
+15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Alexander think Logan thinks Evelyn thinks William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd81074e0cc15502613221057051fa412a12c471 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. 
+10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1efd1a2462e6b06d2186e62e33f38f8b20ed2f2a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. 
+7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Liam really think the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5230b8cd247cbe00bbacbdc8698f8a25fd70464b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. 
+4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Emma think Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..453e5c3efb2a56ed4ecbb0bea0a9d4990a1bc317 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Mila think Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b250945700e19a463b235edcb4d4f76c50e8211 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Avery think Mila thinks Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..002b2e4a05b30ea6cd773ab1310bfd5edd69d368 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where is the corn really? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3dc52c154519d91ff2d92664592d67a919bdadd5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Benjamin really think the corn is? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..31281c9130ec9b6d93fe1d2b9f16843679c910ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Jackson think Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. 
red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0333474c010bd7b252d057235e7ed6484785d70a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Liam think Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. 
green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..43ad1c415dd984cf65a581eb51c703061e88c672 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. 
+14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Charlotte think Liam thinks Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e70d6db181c690d5192585028780810e3cfda87c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. 
+8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where is the asparagus really? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8db2c71dfbdbcf9bc3ea6d7053768c4a89e626bf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. 
+5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Emily really think the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f145d74e6b9f0d4eab1c0e3239273415c59d66b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Hannah think Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c50645f45ca5ff0f7acb96ec9ea3c32e408a4c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Amelia think Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a977eed47cdb2b6d7c3b96d2f5ab3a230e120f34 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..338dc1718024bfacb81004b92a1a940e850c299a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. 
red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa39774538a00bb9a8ca454d04a6dc79fc035d3e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Jacob really think the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. 
green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..287c19e82fd1d49487967a3545d187a0bc0b835b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Hannah think Jacob thinks the tomato is? 
+Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa4c9db7c1eb45de7ef1c83b2623e47d82755629 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. 
+14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Isabella think Hannah thinks Jacob thinks the tomato is? +Answer: green_box +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +*** \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dbd7b9ee925bb4321cc5468dc6e8da00681ab9c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. 
+9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Elizabeth think Isabella thinks Hannah thinks Jacob thinks the tomato is? +Answer: green_box +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +*** \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c9d25cce045f5948129c3d68f9768b34dc27039 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. 
+5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f44f14cef290821d5f158b7c9cc32e9ee9c25c46 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. 
+3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Ava really think the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..864a6c09f667c76123aaca472c697d4e5515531d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Jacob think Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1bacc48b92cca91eb089a036ba16c41aef38e50 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Emily think Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bcf2bc9488a2a96ae39a04604e9b0b6aad75d61e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..597af8116a3d9e60b5972db591003f611070d07f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb2842cc03ce423d087b0cb5667ad36159bb3353 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Noah really think the eggplant is? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..303ab847b2af905c378dc896adf1e6086f27d895 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Hannah think Noah thinks the eggplant is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +*** \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..20ac61363b39fafe3e2624032a18056fa27a3742 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Jack think Hannah thinks Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. 
blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +*** \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a33261b0e7bd5d7c40fc8631effee6e6441148f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Owen think Jack thinks Hannah thinks Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. 
blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. \ No newline at end of file diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7351bf647fe41cd05b88517154aea93ab457b597 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. 
+15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where is the spinach really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..acf64df8688905592afc8928b66282bcb76654c9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. 
+10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Noah really think the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c20cc3e5af51e65b1b78bfcc751956654fb6922 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. 
+6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Mila think Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c4b7c428737c8b781358087437813bb33b0a098d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. 
+2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Emily think Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..00b1149b69ab652d8956eb150982d9f12ca212d7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c4183cb16fcf9df3b9d11f021a72f6ecc79d260 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where is the potato really? +Answer: red_bottle +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..155e77870ee2c7c854b2dca4f2f57b8364509a90 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Logan really think the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. 
red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1728b56705eb87a52efbde1fb2d5bcf307643ac5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Benjamin think Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. 
green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ac4aa52b69d03fd341c6f165dcc3c5cf5a9bebaa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. 
+Question: Where does Charlotte think Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..86d86f4d8e059a8967def0b782bb621506bda64d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. 
+12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c6c8cb72da315335aab408f6c4c065ba87e67c6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. 
+9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where is the apple really? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f46df0434b4a31f8323e8303ff3681ca211af045 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. 
+7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Lily really think the apple is? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a0683a2ac4dc543864091944c4760126d73f634 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. 
+4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Hannah think Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..71dfa74bc966a3b88116d050f79fb150ee24d61c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Jack think Hannah thinks Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..01f4d06bd35b30847ff1274d933c96898a5dbe67 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Aiden think Jack thinks Hannah thinks Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..912f86b997e9342000501c0bf0964e718650a759 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ba21acb1151e90359ff243ba8f0fbc4608f1dfd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Emma really think the spinach is? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..54196069039023811b30f96db73e9fbd06d3c882 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Ella think Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a12e355e61fbd3c71483a7ac43a9a73cfbf8b4a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Aiden think Ella thinks Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2070a00523156a57bd46dcbd76c20e4732722f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Benjamin think Aiden thinks Ella thinks Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. 
green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..296dab705425af72918b259463a6a2667c812004 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where is the corn really? +Answer: blue_suitcase +Choices: A. 
red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4f1fa8977103cfdbb36d130ce430770b9e0b8f8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. 
+14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Sophia really think the corn is? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a914b9f555a7977bf81b8df51dd64fffbb7dcbab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. 
+11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Chloe think Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..36e8d98ef62ec86557db5c02e6f7e6af4b47b7a9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. 
+7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Ella think Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7cfc906d78ef115f68c8c9cf548f6c784a9b0bf5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. 
+4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Owen think Ella thinks Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9b33d2aebf68b2e7d1838dfed0ec9778817c8ea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where is the banana really? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1954096110fe19980959b539638c89aa6b07b5c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Abigail really think the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..43e19f2e2d7ce5babc16e84dbc3d3d14673ea768 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Ella think Abigail thinks the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..83b216e40bd0a5aa36b58e359f100ebe80115faf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Elizabeth think Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfa0be40511041e90023baeda09f6451dc68c37e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Owen think Elizabeth thinks Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. 
green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d790941d007aae8e2ccfa6afd6e97bb27f7a528 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. 
+18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where is the cucumber really? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c3df57e211c6541dba0716ee4990f630c021569 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. 
+7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the cucumber is? +Answer: red_envelope +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd1bdbc8a9b2cd40c8e96f8e6a12e2a060f5dba6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Ava think Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f15e25678dffd066bcd29824ebe74ab8c8c7e2e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. 
+20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Charlotte think Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4691038395199ed8df985b368318aedc3ec1cbc5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. 
+7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Jacob think Charlotte thinks Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a7f513a434dc12c5968fad2e5028e76a244b47c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where is the orange really? +Answer: red_container +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae4c733617dca9e7d2301823225587cc1670d781 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. 
+19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Hannah really think the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0912a4b765dd03bc0b3df565f8d7a5d1a2e71e6a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. 
+7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Aiden think Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a55486e3e896cb8b433127277600180fe41db98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Jack think Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fd23afbf244725f7657ffc9b3d9ad019858eb5d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. 
+19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9783bd2a5bbfa4354e38a1afc2c3a9ee12ca4829 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. 
+8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..610bd2c7dbe45a7f4c1ce0796ffe0000686617c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Avery really think the cherry is? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b78739eb219d03466d1d6235cfff1dcb497387 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. 
+Question: Where does Lily think Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..78b2c6b455305f9b94aef2fe3a36233ca08f287b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. 
+13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b520e526508092c8583dd70dd5cef16431da7d75 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..579ef6792f234852deb76027515c6b33f77dba39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where is the pear really? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..95aa1825d109813234f5496b15adecef43d2bef7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. 
+20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Charlotte really think the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..05d1b1d2ed72a42eaab0753a2565abee68d0b741 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. 
+8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Alexander think Charlotte thinks the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..73821e755e65380dcd2197457232366386b32e82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Ava think Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b98bd13d1a4ccc92664a9f2b7d587b08ccac844f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. 
+19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..266a13050d602ff337917844d1c110fc33d11efa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. 
+5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cdcb31efb8517c70a5c45338cf1502f42b52035c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Carter really think the watermelon is? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88245525b79d61ca14dad5910e2500c19e7326b4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. 
+19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Avery think Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1b2a5975c1bee5b41816b43e247c7445e230d7f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. 
+6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Isla think Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..27280c02312b8718fe8c9faac5f399081f507f94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea5ef8decee9647cd3ffe42a87ff4a1ea65d0ab3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. 
+20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where is the lemon really? +Answer: green_bottle +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..db8fb77699a74f318f82109b48ceda3a53670e8d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. 
+9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Isla really think the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..710be04d09b82b243eaa751eb9afed3968d0be30 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Sophia think Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3e17bd0a741f018c383ac591ea1cfa477fcb39b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. 
+21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Evelyn think Sophia thinks Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cdcd2403fea0828baab7c3cc2d7f4abfb5062502 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. 
+9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..49c37651a40b8d9b197ddc3a42d913a83e02d4c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where is the corn really? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..231c30d61279f2a6d0d4bbe74e44d9bcc13a30cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. 
+19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Abigail really think the corn is? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c16dd5c1769b24cdf05871ae6c32c10a81feeac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. 
+5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Nathan think Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..765f654aaf10ac32f2c211caa15359cd4da355fc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Avery think Nathan thinks Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. 
green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6490faf679e3c1d2e4ee6b03773fc6279037a5cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. 
+19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Hannah think Avery thinks Nathan thinks Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e364f39663c43bb90036216502148212365559b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. 
+3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where is the tangerine really? +Answer: green_bottle +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..798bc6e453d5876429229d24dce0f27884e802f4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Benjamin really think the tangerine is? +Answer: red_bucket +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c2a40cf2b1dad86cb6f2f2ba82bda363fa34342 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. 
+22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Liam think Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f16c7300804d6af8ab6ae14af5aa74ffebe58b2a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. 
+8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Carter think Liam thinks Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c113b9450c57ef627772ca30c619c79fa480fc66 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Jackson think Carter thinks Liam thinks Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0d3d7b7abcbd25a4c0118e9bb7898790efcc6af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. 
+20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where is the lime really? +Answer: green_pantry +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..91234e6f376c2ea54c9ef2418ff6570eb61c2267 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. 
+7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Owen really think the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..051325f9e0037aced72e09eda1afa27311011026 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Emily think Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. 
green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..57a27b585d6f5dbe975503fb1f1d8bbd3b7c4f0b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. 
+20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Lily think Emily thinks Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8df57c1b39079ad0880ae224dbe5c97731058721 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. 
+6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..adc72f79a810580c9d7a6d06a0a5e9b1a41eb124 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where is the corn really? +Answer: blue_container +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f834ad0987483b93b12b93f9c8092ae995c18070 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. 
+19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Noah really think the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a68d15ca4d57ebeafa089a1d7726a2dd91257f21 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. 
+6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Lily think Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d36c2b91e17a1cf09a92b81f6322c1ab77729f5c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Isla think Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3c2f6565c74c417cfd2300b991af21f2b0af78c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. 
+19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Mila think Isla thinks Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e48356ad27463e271880905e189c6dddc6f08dd1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. 
+6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc9be7dfe7c9aafe84551d17108d883a6a8efc04 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Jackson really think the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6d6bdf55b0ed6aceeade91a6e569ee364d32a77 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. 
+20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Nathan think Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4d75c69e509436e70a6884e679ce783c7a16ea4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. 
+8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Amelia think Nathan thinks Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5d7feea6df4221269dab7418704b545e8b0a9f3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +Answer: blue_cupboard +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. 
blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..95cbbf70b0e00974741f8b01ec073390301d0d9f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. 
+20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where is the corn really? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..45840793bc856682ac0f34fe69348225e0fb018f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. 
+9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Amelia really think the corn is? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e19e7bbfb665fd1b701f881c0c7821878aba4f0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Lily think Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..36f0ca879c91c54b44c9c2af214c38960b63914c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. 
+Question: Where does Sophia think Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a3436d9e703b50d081b70294ea0b1687cd12e02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. 
+12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Liam think Sophia thinks Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1de433cf02f318915f6b38962d8282dadb11a35e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where is the peas really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bcb77a32ec5a6ebd702e37756ab98c09d2164165 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Nathan really think the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..af607c060f0a7267f8920aa05eda8637ef7a12ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. 
+21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..312e8081a28417a31d6cc0ace362f39cd52af32f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. 
+10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Ella think Emily thinks Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..87c299061efb21ec44d6111bc743447f75865253 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Evelyn think Ella thinks Emily thinks Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce219afdd92f948c10f9f9a06910d2a5eb91d8dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. 
+23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where is the peas really? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..924076b7036ad9ab778bfc9a2c8bb4955ecdb15b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. 
+13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Benjamin really think the peas is? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c9e8ade1e4bbde55fa436921cdb5a5ffaf0d555 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks the peas is? +Answer: green_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a168b8c20e5796349344a3558bae94a83dc17d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Liam think Noah thinks Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..79b36dace36e569c56dae8b459665d16baf525df --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. 
+Question: Where does Avery think Liam thinks Noah thinks Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7795546323728f13bf2a7fca9ebb429698c9fd82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. 
+11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where is the potato really? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef20adfe91122cfbf3a837664782fc253b88317c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Isabella really think the potato is? +Answer: green_bottle +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b18581d7f457b8e3dbfe7ef22a49bf3470efe2e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Chloe think Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..432d6b87dfa6ace9d85bc32e3b3414b50bde6b32 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. 
+22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Evelyn think Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e403c6d8667977c9ca5c331a2a9c9791281649d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. 
+11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..140145e83f30bb908799185cbc4ccb77d4cfe828 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where is the cabbage really? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f1a5557945563d295c73eb62b45c1fb19881436b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cabbage is? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. 
green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2013d375ffe5531c12b5d4ab77023626c2b0ee3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. 
+16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Aiden think Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..572cdb4d87b0cc2278aec4551863170d04af7380 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. 
+3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Emma think Aiden thinks Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d777407b383b52d96c07394fcfe5369d581481e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. 
blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2adeb575211926083a3e4aab622cea8cb294dbc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. 
+18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where is the melon really? +Answer: red_pantry +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6993a5e4688895279ed01e8a4e45e94ba4fa9ce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. 
+6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Owen really think the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c860bdd749a5cbc40f0811322a701c93ca2f93d5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Avery think Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9966de746d4b7e8815f99c77914af9a3a885a865 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. 
+23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Benjamin think Avery thinks Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b44cca544fc1703355fb5388e7cf21b87d73cc0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. 
+9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b57611341751625b8fd3810090827980cac9cf82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. 
green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9492775f76aa42128fcef7db5119618906fe92c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. 
+20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Nathan really think the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b00c9c58624c73d56a798012295c6effa3ee70e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. 
+6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Lily think Nathan thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f6265c7f2dcb69c6417b9497c7bac8eb1bb9b4b8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Isabella think Lily thinks Nathan thinks the melon is? +Answer: green_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. 
green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..acd73d93bef72f3856c96f966a7dca11b442f719 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. 
+20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +Answer: green_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5ade772882e71f2d7b20fd26296d2eb05e33a39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. 
+5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc86ad5c52d5daf850e8434b2fc5755fea2fe180 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Noah really think the watermelon is? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a9a77b26370e9cf3fb00a80f49310a650f53dae --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. 
+22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Emma think Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..914e87debe63fedf5af3683453431a94838f116f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. 
+10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Liam think Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cf513a1a32c65cd87741bf508c11fbee7b8b303 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Owen think Liam thinks Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f11d087afb0f775f58b78ad748dabd121c803d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. 
+24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a84fe655f6d748ca66019ac6c7d83a1c9be5f7a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. 
+10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Noah really think the carrot is? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf1da1bb4a8928af70789514970e44bdfba69b66 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Owen think Noah thinks the carrot is? +Answer: green_drawer +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f054825efcb90f7f83a982181297433e293abb38 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. 
+24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Mila think Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1c4553ca217a3f6506fbe248ed25d5532bc1bdb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. 
+8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fd16fda3c30a1f41582db42bf3b50a998182e24 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. 
+33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff87f22e4bca347b5aaa2e941929f98e2bac07dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. 
+8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Isabella really think the lettuce is? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3eaf0a6ad080836fedbcaedc3366559085695901 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. 
+26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Abigail think Isabella thinks the lettuce is? +Answer: red_basket +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..be65e820980df3208f13497d5952bf0dabfbfb5f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks Isabella thinks the lettuce is? +Answer: green_cupboard +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. 
red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..511a2905b5785ddd7f3c3486587b06f9bff5d053 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. 
+18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Logan think Nathan thinks Abigail thinks Isabella thinks the lettuce is? +Answer: green_cupboard +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b218e7d1bcee2bbf22e08727f13322a9d01289f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. 
+34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..313a698af415bd0544497bfda543d8dcdff26d42 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. 
+10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the sweet_potato is? +Answer: blue_cupboard +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..55b8ba29df478109a3e00f41d351b3d90f6a25db --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. 
+28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Logan think Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fefaedc1f04799f0fb3474f39149ff45cb686430 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. 
+4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Charlotte think Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..164251b54ad6f7e0b178dbf58514969f82d4134f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. 
+22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does William think Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd98d7b83f020a07284da6e0cd521b03e2a8eb2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. 
+34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where is the melon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..90b371506c27aaf28fc4159ab8f7c3c42ab7c22d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. 
+10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does William really think the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ebf9a210f04e2de450829b327d938302f3ebf02a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. 
+29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Lily think William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d31fbe4eb837443ec71d1392df5573156b1848af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. 
+4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Emma think Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..141cef7049389470e66abcf6373ff97de3b58297 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. 
+23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Isla think Emma thinks Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..41d71250f1b020385db9a0e111b84b097d037f23 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. 
+32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where is the beans really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..629b2ae699b43a6a26b6ba4a7010d141d7b3548d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. 
+9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Jack really think the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c1a8021f2df483742bc3ae53b600643aa802355a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. 
+28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Owen think Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..44db0daaaf3e8fa7cfa80889f600396d0bc5fe1b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. 
+5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Liam think Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..85258a96b9d5375c246194141c295f75422f4ee9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. 
+22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Benjamin think Liam thinks Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f01f0eb97fb46a9b4bdc601d4884d865669ce2fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. 
+35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..84dfc9a147944c61a4e985fa4c5ad9febb08855e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. 
+11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does William really think the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec525779ba697ba5ad2f27379d1d2b9bfefa93c9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. 
+30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emily think William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a80405f497a4cbc940f93f4a74eeed0654a3a509 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. 
+6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emma think Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..12e4fbef8b07cb571a339033766dec734c38e657 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. 
+23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d0ad5d81cfbbb441a1409dd8dabadd3f72984ed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. 
+34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where is the cucumber really? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c247826568f5f2b15c298337572d6afde48702af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. 
+9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cucumber is? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4058013d442ec486fa07e7792f3ecf1d298f5a4e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. 
+28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Abigail think Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a9e40e2511fdc07db71b4d0f8d4a8cf8e8d1229 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. 
+3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Hannah think Abigail thinks Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f855d5eaefd58dc054105007ea64dbfa2321a46e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. 
+21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Owen think Hannah thinks Abigail thinks Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c51bdb584852bb05a0c73e1556f30495daf06f84 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. 
+31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..710b191235df534bfb4060479a7e42880ef258d8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. 
+5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Jacob really think the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..64855c34c3905a4228a1bba528e116006c57f51a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. 
+20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Aiden think Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ab01fa777dc83a6298e9737fb166ed0ccafaafe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. 
+31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Mila think Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0989d4b70a152eee60508238d0df66642471838b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. 
+5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Elizabeth think Mila thinks Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..04b42e5c727403d6fb1a0b95aaf112c5e7f4d677 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. 
+21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where is the persimmon really? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bb0704f4994361831d28fb452ecf9600750ce1b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does William really think the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4356ba09c632821f338f1f96b8e259fc302e001c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. 
+20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Hannah think William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8999d6ad0fcaff1828dbaadc3e7622aaa9564e1e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. 
+33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Avery think Hannah thinks William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..475ff743b4627177f7c9f78aac926769d3401abc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. 
+10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Alexander think Avery thinks Hannah thinks William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..986583fe65e06e382935723bbee25f40d30c6bf4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. 
+33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb389f5c4a5691725db504bb1a6014aa3baa6b2e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. 
+10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emma really think the eggplant is? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..73985040f2f4cec88a9c01f8233e374ae475a95c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. 
+33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa553cf5baab0e18b06c216dab625db176a7178 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. 
+10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jack think Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..08c77afcbb0679dead88ae57d34e89877a20cdfb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. 
+33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emily think Jack thinks Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6f97d0d966b3acf4e56fa7b090cd20f4be6a92b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. 
+10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where is the lime really? +Answer: blue_crate +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f05ab2c4bc0dded9e6936a5a7b648ad5228f080 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. 
+27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Elizabeth really think the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f23336b2e75a40dddd4fea673c561e3ed19f53ed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. 
+2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Alexander think Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..82d6dd60385bc1879036523e27bbae6c44f87385 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. 
+21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Owen think Alexander thinks Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..53e3b8193894488fc98c98e13be8c33526dd9774 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. 
+33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Nathan think Owen thinks Alexander thinks Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7aae8f7d16ccca735fae68f52f14b0d7a65f0497 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. 
+7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where is the pear really? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..480abb8ad29d945b44afc043daffdd8e1af8f251 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. 
+30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Noah really think the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..39db33d57a9f83807f0bfd3d8761afa3af1e137e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. 
+5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does William think Noah thinks the pear is? +Answer: green_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..01163a19f97c54cb85b491972026270b10eae1b6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. 
+28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Isabella think William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..258093bad06b3d04104c284659cdfb352c7ac08f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. 
+2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Aiden think Isabella thinks William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..573eb3442cff5c59623032a7c15518c25c483c78 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. 
+21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where is the onion really? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8ec162fb18645af4502f965fc9090fb9974dd121 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. 
+35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Nathan really think the onion is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..05b14eaa6841783bc57156dedff161eaace60d92 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. 
+9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb3871e4fc4fa928a751193866d9bd1f64eba893 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. 
+28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Owen think Emily thinks Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cae986f7a5dc14e9059b399dee6d9085934d8cdb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Owen thinks Emily thinks Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. 
blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..57056dd2802d03a50d8073ea46535d86d4bb4b20 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. 
+18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where is the spinach really? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..30d0c65ae66996396d8f7f59d19fc0c0300ffcec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. 
+32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Evelyn really think the spinach is? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..53aaa1eda2f884481f6e11d042d6a0a73f5a2f35 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. 
+3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Jackson think Evelyn thinks the spinach is? +Answer: green_cupboard +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. 
green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd8981d705872f07dc27858819981deb28e2b4cf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. 
+18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Liam think Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c9917ecb22c77d51307d636a81321f57cf43b62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. 
+32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Elizabeth think Liam thinks Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..09f92f6ae865ff17f63713457e5fe62243f28c79 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. 
+4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where is the peas really? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecad6db5bca9fb79167e4f434ad220e494663ab7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. 
+22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Isla really think the peas is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..577a65af4ee71b9ab745de770c4d90123615cb61 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. 
+33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Amelia think Isla thinks the peas is? +Answer: green_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7be13373e565f06b20a39833a9270790a7db5c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. 
+9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Carter think Amelia thinks Isla thinks the peas is? +Answer: green_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c259d7fb1326eafd5a2fe4100e230414a1307da --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. 
+28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Mila think Carter thinks Amelia thinks Isla thinks the peas is? +Answer: blue_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ee297f009ddb2511abb1049475a9d431f2551a8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. 
+3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where is the green_pepper really? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. 
green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d19ba957d7b4d744fd2b95ca1d1a07efccce071 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. 
+17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Emma really think the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..edaab4f633c7afd755efa30b1ae8cd467c235793 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. 
+31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Benjamin think Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..711538799bd75a7a00c448ba3bd48b9d22e8bc44 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. 
+4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Jackson think Benjamin thinks Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. 
green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4c1e52d18b90a5729d051a5c7c6c3e81674dfc6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. 
+18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Abigail think Jackson thinks Benjamin thinks Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc1ee8b06ed8ac421543e278ce284ff797cea56e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. 
+34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where is the peas really? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cfd5f8cace61f5a3ede745c31008c2004b0f29f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. 
+9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Hannah really think the peas is? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ed5c78215da5ccb66bdb48de8a4915e93becbf2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. 
+29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Amelia think Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..385644af57a7aa16f4046c3549a48b458cd32b5f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. 
+3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Jackson think Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..33452e2e32c764cc2b5cae9c7a00730e093d464d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. 
+21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Abigail think Jackson thinks Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f15c5e7f644288471bf380e5dc0d5b99b4dddd0f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. 
+34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where is the turnip really? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..433202c35efb936468337b3551cc6fe5e42e6a2f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. 
+10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Hannah really think the turnip is? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..89a555c179888f9b291a2dd343d35d12baf4d9e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. 
+28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Lily think Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6dd4b24f1768b29b39116ebdf91f3df08c6b0d8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. 
+3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Noah think Lily thinks Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e2afcbfa04d9157023115864d9bb64192724f04 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. 
+22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Logan think Noah thinks Lily thinks Hannah thinks the turnip is? +Answer: green_drawer +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..504b8aeba3a1fcaa39001d083ab93e520ea765e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. 
+31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where is the watermelon really? +Answer: red_bottle +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..72c96c6d3178c7f62eaea60461481974a1ad25e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. 
+7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Evelyn really think the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa05d4f171d84c28d5bdd4a1f42e34bdfa52eb41 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. 
+21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Logan think Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3d08a7c581944621c07916000bdab27ed616637 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. 
+31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Chloe think Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0518de0eaa1a95b092c5fb4c185175c255f2e0f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. 
+7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..91bbcfec9cfc9cd78b95e3fb37e3a3d84dd7350a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. 
+24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where is the lemon really? +Answer: green_drawer +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..46d3ec2bc11b9a57d712e98ec6940ba4d39c4677 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. 
+36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Aiden really think the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fe23f80bcaea16572ce0ff3b0841b38eaa222b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. 
+10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Nathan think Aiden thinks the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..425a976996d516d6a5100dacfb4db1bf8050e84f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. 
+30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Jack think Nathan thinks Aiden thinks the lemon is? +Answer: blue_pantry +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..74da87e0984fc0f2fa6a57502191b7df301d55b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. 
+3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Jack thinks Nathan thinks Aiden thinks the lemon is? +Answer: blue_pantry +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d871d1806c795bb8506a8f02bb04cd3455b6e4ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. 
+20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d4a2ca783d0bdd9bb4151b2dc4d6c4dc57ee36b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. 
+32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Isla really think the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..50a67ad88d1d06f27e7ce4d73675b9311eecb101 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. 
+6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Elizabeth think Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..edfc97e2bcd279df5dfb13a85bcaa8ea6f3b726c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. 
+20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail think Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..68d8608de99fdb77dceeb0b58073b0f614b09b6f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. 
+32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Abigail thinks Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df7bf1f66ec9e3f7440b1b8eedf28b5e9b6b8630 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. 
+5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where is the lettuce really? +Answer: green_drawer +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e11d28d832c73ed6919735ac506eb0f0fda3eb65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Avery really think the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5c5cc7577f66cde242e579594f5bb5a36745db2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Charlotte think Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf655989f9eb368fecd358f62e3b729814248bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Owen think Charlotte thinks Avery thinks the lettuce is? +Answer: green_drawer +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..af946f1abd616d79b274ba31cfdff8b78141c07d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Isabella think Owen thinks Charlotte thinks Avery thinks the lettuce is? +Answer: green_drawer +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. 
green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..08ab2900ebe7887d2c715d2054238197fb420d4a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where is the plum really? +Answer: red_pantry +Choices: A. red_drawer, B. 
green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0150d41957dd210a52c0e5331066902359ad859e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. 
+16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does William really think the plum is? +Answer: green_bucket +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e9cdc1d78fe6f1ffceeec639d98e62a42625fa9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. 
+12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Nathan think William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f4a5bb34fbd22c5a1b34b246133c86aaf8a9bcf2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. 
+9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Evelyn think Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75598ee803be68d9375b76048f147b8022947aaa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. 
+5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f2cb0fbe8d5eabb26415aeff9e3c5e95aac420c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where is the orange really? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7965af473287dd584d793ee1baee8faec2a56452 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Ella really think the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b383282f1c009f71168304f3a24a0265989100dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Elizabeth think Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c028492fb832ed638622ebbf1562c3af44151bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Chloe think Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d494e82d2427c7f91d6e66211fca913fd2ab30c7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Alexander think Chloe thinks Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f79d5ea1978d79635897d549278d957d56fcaf31 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where is the melon really? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. 
green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b69bb9e494156efc2c67181bca8c70e829e05110 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does William really think the melon is? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. 
green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..79ddd5c8221cce717b56c72aab3304fdb0b5dae1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Mila think William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. 
blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..df350b8abacaf9758052ee9a622bed0058da7d2b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ella think Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. 
green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..883c0a37f489a6b2869cd50e2409a0e89469c393 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ava think Ella thinks Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. 
green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b07f80fe86f23e3bca607d93dc8e8223e8bb379 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where is the cabbage really? 
+Answer: blue_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..517c5f77f30befbf56f88c27d62f59109afc193a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. 
+13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Abigail really think the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a9ff01854a5648676c0dfed4089b4402c335e8b5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. 
+11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e2f5c1588379f748b136b9c72ccd6909009435e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. 
+9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +Answer: red_container +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..019d40fa399607ad95879aff52e14304596a6f17 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. 
+6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Charlotte think Amelia thinks Nathan thinks Abigail thinks the cabbage is? +Answer: red_container +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..112b1c6838475707e5efcf194687008277c46195 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. 
+3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where is the lime really? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b65a0296ce1f650f3123ae64fbc0ebaef58d9efb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail really think the lime is? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..de9135f50b55d1e55b55ece6c16309ae373edd6f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Avery think Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5321c1154f6580d36e000f586259ff7881269f9f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Jack think Avery thinks Abigail thinks the lime is? +Answer: blue_pantry +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff6bf681b3145644ad068903feb0ef7da24f88e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Jack thinks Avery thinks Abigail thinks the lime is? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..890fda18ef8d652cd247c1a96f4143ac2bdfb718 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..99bdfae12672d3e709ba885fc39b75bf37aff8f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Avery really think the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. 
red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bd2bddfb26d09b5e655ccc3cb0c3c8ff5f9bc1d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Owen think Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. 
green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6909b1adc0a2d562fca7075784842118280e8cd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Ella think Owen thinks Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. 
green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..edfc164697f1d01c61cf34affe4fc02970c7f4d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Amelia think Ella thinks Owen thinks Avery thinks the watermelon is? 
+Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..80a883e4a8e2f046ab387409d8e7600b50f38a05 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. 
+15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where is the carrot really? +Answer: red_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..49f2b5868281b77b5049d6028a7e9e21a69ee0e9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. 
+12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does William really think the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..69a52b01d094d94d0eb85649c492a850c08e5f95 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. 
+9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Evelyn think William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..29316b5611247c09886808a37a47ee0aaa5904d2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. 
+5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Logan think Evelyn thinks William thinks the carrot is? +Answer: red_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d86c68870220d7026eefa375fd1a5a7d061cf25a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Alexander think Logan thinks Evelyn thinks William thinks the carrot is? +Answer: red_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b933285d59ed95a71885e4cffdb55fcab817e653 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..56b943d8374ae1835d46ab9a55bfa3ec035b089b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Liam really think the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..739e50d2be0cd9b7188f13c1ec54c2ecc15d878f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Emma think Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9e66586646bb188fe6eb36867c47bcbde41decd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Mila think Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..571af1baf069d48bce280a57560347cdfff11234 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Avery think Mila thinks Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. 
red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..476f3c2902ca710cfea542b53c8543fdad97d034 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where is the corn really? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. 
red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..78f06f4208e9ec0a04d4c13210d3425a4aafdf43 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Benjamin really think the corn is? +Answer: green_crate +Choices: A. 
blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..90fbc5d7912181f01df3705911299607f5d1666b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. 
+14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Jackson think Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c15cf93d27cb2bae73dd10888368ff393a78fe78 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. 
+10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Liam think Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..595aa4bacae0016bccd3ab5cdf6114687184e77b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. 
+6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Charlotte think Liam thinks Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..39e9fd744941357382d88746c89450aa1616731b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. 
+2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where is the asparagus really? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2ce92c3b5b0c8bba704c5b00335ebbae34257e2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Emily really think the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab198d79e5a680ca14246c4d12f095bbffdae088 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Hannah think Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3a9c52d61d7afbb3b8738d2abe65c7e1184e8d6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Amelia think Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1e4124b6eb657bad588c0859b29598178089f4d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..21798a09da10f456c9adc102733cae9f7b372fc2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. 
green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..462be88156f374a6e93c6b55b91ef57d7d275c39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Jacob really think the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. 
green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4bf49de1769801b2116b05981da805fecd4debd7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Hannah think Jacob thinks the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. 
red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba1184c34f6dd1d20c89086a85b07de18d3e2728 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. 
+Question: Where does Isabella think Hannah thinks Jacob thinks the tomato is? +Answer: green_bottle +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4fe35f17f92b39161e5e870e2b3fffbcc8b21751 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. 
+13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Elizabeth think Isabella thinks Hannah thinks Jacob thinks the tomato is? +Answer: green_bottle +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b73e6477a54baecbf530eff2b130f823002471c9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. 
+10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b097835f533504bd5b4722e0552d095d3c4f821 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. 
+9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Ava really think the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6092bf5ebd5eb23fbd30dbb8631e83abb3d445f3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. 
+7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Jacob think Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..49969b7ebb0e49b3de7f07dc70f7f5d177b145ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. 
+5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Emily think Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5e4e4f732038b999a850001a0a088445dbfe4e57 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. 
+3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? +Answer: blue_cupboard +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b9b0311eecf11dfc8a2cd29d38854038e5f0b18 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5f91d9895d5e51b28c050aedc3c0751931cbdec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Noah really think the eggplant is? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0944ff2efafdb98bdec64b9a9b3224375744353 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Hannah think Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dbed26c5f35faaf1994d0bb2b00adf8242b8e078 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Jack think Hannah thinks Noah thinks the eggplant is? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e509e7a75de73c54b2b978bdde0081aa7a0d8334 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Owen think Jack thinks Hannah thinks Noah thinks the eggplant is? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab3c251d4966ad78cf7d1b37b5ca3bd79fb84bf7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where is the spinach really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..05e1cf403a7e599bef67fae46184686c6f4116dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Noah really think the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..031cc49432ccac85a18ac31694476af517370c65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Mila think Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. 
blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad04cf90644eb0f56cf42183451581167cf87eb2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. 
+Question: Where does Emily think Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..30ead0597cbca213e0bb18896256629ec7759d42 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. 
+12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..29004e3b8e763b3560e5ebef531190eac7aa4d39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. 
+8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where is the potato really? +Answer: red_bottle +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..87c0fed78b9edf718c300ec88f76aec86d02e6e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. 
+5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Logan really think the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5041aeef0f0a6a60828bae696e21bfcf3adf73a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. 
+2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Benjamin think Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc563c634f6ef48a7b57cd689d4cc3e07f8f17e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Charlotte think Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0decacc0ee8937fced849ecfc2f65db801f130fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..18f025f9831ce8773ca9927b99da3985b3e08fd2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where is the apple really? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..38455f23ca4b708a43897379bf973103fe00bd06 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Lily really think the apple is? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..42860e12abfbc827881c426b6f74ff94308cb916 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Hannah think Lily thinks the apple is? +Answer: green_bathtub +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. 
red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb6ccfd2bb61db94cbb4d70d40e745103d7303d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Jack think Hannah thinks Lily thinks the apple is? +Answer: green_bathtub +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. 
green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..46c68e12af81a04d3ec1c6ec28842a3cdbc1e7c7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Aiden think Jack thinks Hannah thinks Lily thinks the apple is? +Answer: green_bathtub +Choices: A. green_pantry, B. blue_bottle, C. 
blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..58038c44353c7300486902f0a137b5999493d4c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. 
red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc49987f1d58ae7d1211072bd26f81e8004c116c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. 
+Question: Where does Emma really think the spinach is? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5ad7fd074d822ed485a9a24c5b21dff916dcf47 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. 
+14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Ella think Emma thinks the spinach is? +Answer: red_bottle +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1fb1c08f236aac7a1086a724f3344300954a6c9e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. 
+12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Aiden think Ella thinks Emma thinks the spinach is? +Answer: red_bottle +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..264836cc9c00d044b7f6e3763fd7321833937e80 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. 
+9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Benjamin think Aiden thinks Ella thinks Emma thinks the spinach is? +Answer: red_bottle +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2df1ef1e9e83594d578dd6dcc5a6b67a03e338e6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. 
+6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where is the corn really? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e78ed7d003ca2aec306ea46c644b387ce5da68ea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. 
+5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Sophia really think the corn is? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2968fadd464257586e3c1356dcf9e942e4a8e6b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. 
+3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Chloe think Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..747297084a0d4d04cef5b79935e9ed742c73ea38 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Ella think Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3f0eb6f502674a60d1b1266302c9543c62b54f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Owen think Ella thinks Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..53699b8b019c16281915726872c35bda7e17d64f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where is the banana really? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..767d98cc8a0e6ab5a83fcee82f13e1bb8e09f62d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Abigail really think the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab8596afd9de78f0a71f1a282d81c0368e9c04f4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Ella think Abigail thinks the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e96302dc6ee2839771332d720cf87def2aa1054 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Elizabeth think Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. 
green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5654b1fcafa6269f4ee2c880183b72e9e2e3b9b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Owen think Elizabeth thinks Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. 
green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a66f42ca17beec5174ba45565a45888410e56ce8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. 
+16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where is the cucumber really? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce8f2c9557b49c87741ab3d96721f71aa910aecb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. 
+5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the cucumber is? +Answer: red_envelope +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ed0d8df93e66207c74f5dc37a06fc6745000b18 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Ava think Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e00e0afd20471a51e7aca6a8573f5ca0a3e1bca8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. 
+20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Charlotte think Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1116a14d8156b53c734c3c5afa34c5fab548e982 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. 
+8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Jacob think Charlotte thinks Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3490a25ea7ba2c73ebde695318034462e80eeb4f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where is the orange really? +Answer: red_container +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2f41597b3aa48aaecd5f0c1fba8ab87fd98d138 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. 
+20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Hannah really think the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..702fa7229079b4b754f8b46d93e95d1b73c838e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. 
+8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Aiden think Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bf6da58cdd7b7fb830481eea2272223fb3218a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Jack think Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c12191d4ff5f90b6cc3379a39796177d3f258544 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. 
+20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b02c490d6d515810c559c2cc6ff80ca5ebf3bfcb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. 
+10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a8d2a2fff8cfd273acca6b610f437bc24104d87 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Avery really think the cherry is? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bcf70b5ee1637c0b1de8937caeb2665a55cd8197 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Lily think Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. 
blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecd625373ef000213e6bcca2a5074c8809d74bf8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. 
+21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Avery thinks the cherry is? +Answer: red_drawer +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b8bc7cc908923f337c6c8f5920fa41eda9ad553c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. 
+10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? +Answer: red_drawer +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..09c2e1eaeb07c60b63e40f10a1c31bc50b85e3ce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where is the pear really? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b128a1301829899244d4b7cdc1055115711e594 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. 
+21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Charlotte really think the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d87ea897e3658612746dacfe0d2183b27a45d3b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. 
+9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Alexander think Charlotte thinks the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbf0625f4d3278f15c7c8ecfbf0a33460dabe2f2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Ava think Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..554f10a5c93ba134a91f0575ca7becf943e474dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. 
+21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..93a85dd4f7f5430561b7f5d86b8d2507b7f3c931 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. 
+8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5a5df65bfa548c8d66cb86dbe34e94ddf0bbdf3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Carter really think the watermelon is? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..604bfd285a566c393caefc1b0f2a1c099eedf0ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. 
+22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Avery think Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ccec7fa7ffe09bedf192b6aa53ba1553ffce4726 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. 
+9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Isla think Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..da9ff330a17bdd3eca8be34597190fc0ce007963 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bcc496f2ae2e9526d5342e54690f9d7cca13834 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. 
+21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where is the lemon really? +Answer: green_bottle +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..43e37ef5e87cdabbb34cf8f1ff176b4c3d70397f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. 
+11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Isla really think the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fd9c67f6e9a62aca1b49bb04a66740f399b819fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Sophia think Isla thinks the lemon is? +Answer: red_box +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c01da5318e277926f5f94e7eb60a0d57730d4ced --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. 
+23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Evelyn think Sophia thinks Isla thinks the lemon is? +Answer: red_box +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..44b7fe5b4244d5a11ba2b85948e5fc42fe586bd2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. 
+12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? +Answer: red_box +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3ed8f67d3def5fc4df7aa549f90b6db9c323e58 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where is the corn really? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..99ab90e32d26daebf2f92493dc424de14b1ab72a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Abigail really think the corn is? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. 
green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5c88b7ae3b610549585acc98d380a28ed6d1a2d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. 
+17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Nathan think Abigail thinks the corn is? +Answer: red_basket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6ae2a845dbbc71c0883310f7a10e20d8d32400f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. 
+3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Avery think Nathan thinks Abigail thinks the corn is? +Answer: red_basket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..edc27e88c059b7af4f08380d7c411f54d22a3a19 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Hannah think Avery thinks Nathan thinks Abigail thinks the corn is? +Answer: red_basket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. 
green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4776243b9a655fbcc3ad43e0036e7069dac4d227 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. 
+17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where is the tangerine really? +Answer: green_bottle +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..762436403924671582906035559c2775e0590426 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. 
+5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Benjamin really think the tangerine is? +Answer: red_bucket +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1448748b666f880411b85f5670da83d0351ad96c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Liam think Benjamin thinks the tangerine is? +Answer: green_bottle +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..670ffa765143909bd491e1e49360bc950d8b8fd8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. 
+22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Carter think Liam thinks Benjamin thinks the tangerine is? +Answer: green_bottle +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..292680ad1268a03c9f28d7d6d859ddb092f3c133 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. 
+9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Jackson think Carter thinks Liam thinks Benjamin thinks the tangerine is? +Answer: green_bottle +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..22ff639cb98c95cca03a9a4715b768648d7dc071 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where is the lime really? +Answer: green_pantry +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..af9cda0a4bc11f392657f1256dae910e164f5627 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. 
+21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Owen really think the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a104a3f02e60cdd4a05183b72c9fa17d9d86a902 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. 
+8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Emily think Owen thinks the lime is? +Answer: red_bottle +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca6636191312b82da2ec18ac2d799020b1f43c50 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Lily think Emily thinks Owen thinks the lime is? +Answer: red_bottle +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. 
green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..14e28b5b60b97c28298f2ef97a5464367c1bcc68 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. 
+21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +Answer: red_bottle +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3c9ade78dfabb95519ad1ba22a8600b2b6eb059 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. 
+7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where is the corn really? +Answer: blue_container +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..96e225e72f8ef15cce3ab2200bc1f4f5c8908864 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Noah really think the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cd6fcc97e7e8e0c4a1e1d2db57ab1aaa0dd4ab5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. 
+20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Lily think Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..06840beb675e04666ba4e357d2bfcff7371e252e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. 
+7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Isla think Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3544ae9f30e1ecb1417f9b081b22c96412cf25fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Mila think Isla thinks Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a243f98bb95b538f4ba8fe78a97c662c2984501 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. 
+20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d9706e422efb341b9676530f43fc1048cc6a5505 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. 
+9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Jackson really think the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..46be924431412068ac8d49ae5c9d56dfbe811e09 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Nathan think Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5627939900e374924bc0ae895b2186e09a58cbeb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. 
+21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Amelia think Nathan thinks Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf4cb52e8da8d5523cf0e6b771c58dc6a905f8f0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. 
+9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..26d415499182eeb856de09ba922547ee74235488 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where is the corn really? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64ac03c7498bc58ab63fec764103738c361e5625 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. 
+Question: Where does Amelia really think the corn is? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ab4145ede14397d0f45a3b4d8b5c496d7895d1e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. 
+13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Lily think Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe8d9571a5468bf83e095e04e1faffb98eb7d564 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. 
+3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Sophia think Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f143babec8ba4da53e01e163e8c293f106fc48d8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Liam think Sophia thinks Lily thinks Amelia thinks the corn is? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f3f1f98e5435c17973172ba53c116db509d3cbe6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. 
+23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where is the peas really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d17719da7956d7fd64d06b22fa671b7077bbed8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. 
+14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Nathan really think the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd0e85c7c20ce2f7ad5fabb7fc5e2ba986a0285c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. 
+2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..22a7715a0aa9e62c6a15d2e4b85e13c5560b0b7d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Ella think Emily thinks Nathan thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a7144f39e5036f3c5de56f00eb372fd3c9468d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. 
+23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Evelyn think Ella thinks Emily thinks Nathan thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8619491419c6220d1544d0d27edddb90fdd287bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. 
+13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where is the peas really? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2353ae801bf12fd30eb415a9a220d1a1088d589 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Benjamin really think the peas is? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..59985231dea05fa07db2fcca76b1cd36413c5363 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..714a875882371368a785487ae9fbea33fa1072fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. 
+Question: Where does Liam think Noah thinks Benjamin thinks the peas is? +Answer: green_drawer +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..048e0eca080b10df906485c5bcd41b3d82450e77 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. 
+15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Avery think Liam thinks Noah thinks Benjamin thinks the peas is? +Answer: green_drawer +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b19a384a67059effd206620f4d3800992479bac1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. 
+2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where is the potato really? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..93cd42201fed60370bd6a9c8fdbde96be7a4e349 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Isabella really think the potato is? +Answer: green_bottle +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..27bd9988ce94af871424f9edf3fc45bdf18614a9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. 
+Question: Where does Chloe think Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4524ade7affd12d09bccaa84a5ec1cad870749cb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. 
+13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Evelyn think Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cefb051b3679c05b87b9b2b700838944b0d7831 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. 
+2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d560aef8676abf8e9cad3229c6d43b80657eb5d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where is the cabbage really? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..775f3af994694d2e67a0e5813301e7eb44264ef4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. 
+20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cabbage is? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c21e2bfa81e8fa632104e322bf76eb58e2005b1f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. 
+8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Aiden think Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b253118c5c3237a001f52cde07c24ee3dfe6dc7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Emma think Aiden thinks Avery thinks the cabbage is? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a37c8c85649370c671f4a1eeac999a169e58a9b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. 
+19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fd9c085a9e3d68df7b294830e014424b9358827 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. 
+7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where is the melon really? +Answer: red_pantry +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..db05e0ba1128f5413093a2cbbae88044b82a9a30 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Owen really think the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..055b6dc0d3f60dd05f9a42489b11d19034989171 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. 
+23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Avery think Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa807c1305f3fe25008dd0e0104fd8458e9d5c79 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. 
+11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Benjamin think Avery thinks Owen thinks the melon is? +Answer: red_pantry +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c6f14461a8abe7faa41e9d5768d737991c85752 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? +Answer: red_pantry +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..12270676cefffa11082e3f5ebf816d20580d87b8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. 
+22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8677b1890c3b51d39b362f067e25e0797a7d8401 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. 
+9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Nathan really think the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..37b98ceac45e1a064d1e7010112e30563cdeff93 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Lily think Nathan thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. 
green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a7fa865270e0a2f7bce1195aeef13730af41a427 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. 
+20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Isabella think Lily thinks Nathan thinks the melon is? +Answer: blue_container +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6ef14a72b94b70c143d5c7f0e19d123e4c7f545 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. 
+6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +Answer: blue_container +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6ab7a7df2abe135bc2d2c063e0860564a3066ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..36b515e5ea96ffb4f4bab83476c3ff461455ffab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. 
+Question: Where does Noah really think the watermelon is? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6faf71acb413f67b6a9ce5f25583af4aa7060b65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. 
+13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Emma think Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f380c0102ae134c17e5624e99b37c9ddf34ab30b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. 
+2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Liam think Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d56da01139b19cfd78f0ab302011ea0fb0b5b4f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Owen think Liam thinks Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0855954c1c81b04a3d281d578845eda1eb8b72e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. 
+25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c1f8828f4b7d29e5b159a4e2f1a9741b9e3ff94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. 
+12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Noah really think the carrot is? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5b929e52d0134d6722a3aa4e832bf4d56484131 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Owen think Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a75d6268dabbb02320d181dfc4e683d7fa5bf98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. 
+25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Mila think Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1311f4887834a103efddcda1fa37ee4dc17b4e0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. 
+10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dbabf0a405e8cd75f28a02b0de373b1f1f6e3704 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. 
+33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e7369208161365f0feccfca5900f9fcfa5f051d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. 
+9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Isabella really think the lettuce is? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f4a20f84486cc17597c4187d29edb708727a71e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. 
+27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Abigail think Isabella thinks the lettuce is? +Answer: blue_treasure_chest +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..625f298cb3cf19812fec336e9ab794926f54224a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. 
+2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks Isabella thinks the lettuce is? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. 
green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae6a9ce7b851b3659a9fdb50488cfd158cfd2b0f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. 
+20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Logan think Nathan thinks Abigail thinks Isabella thinks the lettuce is? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a961e68dc3b9bbe275e755864ed89ad32aa835a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. 
+34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ea68dd233abef5e1d5f1d4991b4d1d13d98e605 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. 
+10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the sweet_potato is? +Answer: blue_cupboard +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b08c5a7cb2f4a884c66f576bfe4fe968571c143 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. 
+29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Logan think Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f1d95888d687705f9e32ae7ef76b27eaf6d463a3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. 
+5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Charlotte think Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..45eb271eaab9a6901de27faf595acab4d6b92115 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. 
+23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does William think Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f958469bfe8a502f55a802cfcfb85ccd80edc324 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. 
+34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where is the melon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..86dc085bdcd142056178aa13168cdf49b052e9a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. 
+11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does William really think the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1ae18732fb90c57ee4b8918eb0f9aa81a82c8a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. 
+31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Lily think William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f57107a9f4e6311cf93089865320a53805678fda --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. 
+6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Emma think Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7f6e7607bc673e9ed5af943a2eca64bc6e8808f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. 
+27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Isla think Emma thinks Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..abff96137ca9795ff89fc5ce1ea90c5f030d4b43 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. 
+2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where is the beans really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..03ff34c0e0904b83e8692a075dc3a02921d7345d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. 
+22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Jack really think the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9d9fd7c2ec5ae709091236c45cad2cee49795a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Owen think Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f86aee4b935cc2c175cc441ec59f6e18228b434 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. 
+20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Liam think Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8d249ac820d8e825de8efe11538c8f1426bc3c7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. 
+33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Benjamin think Liam thinks Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5e9a3d2ffddabf237c01f27a9e83431ee3be7407 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. 
+11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f355c99cf201d88fbcdeb7dbefc07a1bbcce3eb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. 
+32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does William really think the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f3ed57facf44705c1178c5136f8c8bf8cdecbdb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. 
+9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emily think William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7db61bb2a258c05545035c74931d4192877c17d7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. 
+28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emma think Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4843e693bf326720386b513317b535e989f51bd8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. 
+3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..67a97fb4b423a59d423ff63dff0242e5ac831a50 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. 
+23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where is the cucumber really? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f87d245475c10207e42db62d4a9a8a93010f974 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. 
+34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cucumber is? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc2be9265cb3849a78f193789cdbde57158f351e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. 
+9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Abigail think Avery thinks the cucumber is? +Answer: blue_drawer +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8541ee083f730e8d26a568530e5b9a747dbc92dc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. 
+27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Hannah think Abigail thinks Avery thinks the cucumber is? +Answer: blue_drawer +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6a5f16628a2814d076ec5a64372cb2c28aa2f14 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. 
+2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Owen think Hannah thinks Abigail thinks Avery thinks the cucumber is? +Answer: blue_drawer +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..14b4014600699bd6ee0c4e5f938cd67b666ef5ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. 
+17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a7cc3d963bc0d5a800b1719f241293e00e4cb902 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. 
+32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Jacob really think the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..21b77a27b86e487f2b1d1ec11664f10e5575b3f2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. 
+7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Aiden think Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b5cf6fe7871c3398fdbbb44df744e57dbd0f0bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. 
+24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Mila think Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6068f2b1d9f17be319d8a5297594a694b6b17ba0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Elizabeth think Mila thinks Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. 
green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..23bfbef2ff8489ca2d6ca5058bbe0c4943337498 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. 
+17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where is the persimmon really? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..819b7d24f54a417d75bdfbadd19fa87f99f74aa3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. 
+33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does William really think the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2ba65aa2591129f3afaae8076c73c93c25d6ae4e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. 
+11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Hannah think William thinks the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..23866d91fcd30e3ee2c6253478b1a0dfaee2f47d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. 
+30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Avery think Hannah thinks William thinks the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e60418623fbc152f50891a4a2e4abaf8df5cc22b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. 
+9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Alexander think Avery thinks Hannah thinks William thinks the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e997869cccb10075ada8a2ddd5d360b728232ed1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. 
+32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..481f985dec3abff08c38f243fe293abe6969bfc5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. 
+10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emma really think the eggplant is? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8fd4c412c327710646286be46393d94f4ba64756 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. 
+33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..080c31428512f508776ca59ff63cb3268920dc92 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. 
+11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jack think Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2f486ff037c54797c71a9a10b64fd98a4e59461 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. 
+33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emily think Jack thinks Jackson thinks Emma thinks the eggplant is? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dccb26e92f98004604d72dce8e3855cb60e2632f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. 
+10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where is the lime really? +Answer: blue_crate +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..be4f3a8f275cc53f7096868fe91ff1a984eee6c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. 
+27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Elizabeth really think the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f65649d2570eee16d1b1013e3fb829e661ef1b6f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. 
+3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Alexander think Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b617ce5d11fcfa779461048b42a98ca7915529c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. 
+22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Owen think Alexander thinks Elizabeth thinks the lime is? +Answer: blue_crate +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..862fa11f37668cba3e2780e55157d29696acfe94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. 
+34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Nathan think Owen thinks Alexander thinks Elizabeth thinks the lime is? +Answer: blue_crate +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..28fee0a13c8705a1de80c77a5c5db9f7844eaec9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. 
+9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where is the pear really? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..771b84f03605d0fb664d55f061694f37920b6a0b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. 
+30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Noah really think the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9900f75c35c807ee0717288de3df5f7d218c78a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. 
+5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does William think Noah thinks the pear is? +Answer: blue_drawer +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3629225060eb23046b4f6778cc61df98dacab81a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. 
+28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Isabella think William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0f2c4907c49fe23cda3cb4d04c28e6b4e4e7675 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. 
+3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Aiden think Isabella thinks William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3075d12e4541f00657e6a8805b013c0b7585b49b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. 
+24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where is the onion really? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c88eb2e4684d368273f3fa731d18cb3e198773b5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. 
+36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Nathan really think the onion is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6eaa4c8cca8fadbd9eac4b437d81ff2e9346ce0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. 
+9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the onion is? +Answer: blue_treasure_chest +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..03d2009a344f0722ebfcdc1599536bbea4e319a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. 
+28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Owen think Emily thinks Nathan thinks the onion is? +Answer: blue_treasure_chest +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d9d64bb3670fb10f394f0eac63700369dfc005f1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Owen thinks Emily thinks Nathan thinks the onion is? +Answer: blue_treasure_chest +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. 
blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e86cdecdcd07989f30e4a6eac4cc0a01aa1c8e39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. 
+18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where is the spinach really? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..25f3c17cb2aa065cfb1e1240a0c5d00919721592 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. 
+33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Evelyn really think the spinach is? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a858327ef561647eaff9982f9b4b51c185e2b754 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. 
+5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Jackson think Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d46bad42f012732453041004aec6b49baecf81f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. 
+21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Liam think Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3f8aae5591f8ae27780ed536785ac7e47f9ca52 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. 
+33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Elizabeth think Liam thinks Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..882b780f5a649ea92725d81af2af6a52191f459b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. 
+5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where is the peas really? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c11182d80411be2e4a97fdae12cb1bb6f0040bed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. 
+23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Isla really think the peas is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..540f9fbe32391f54f467a7ce394a05cda09eb005 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Amelia think Isla thinks the peas is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. 
red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9931d1d3e6388fde49ce71dc9982212607a5de8d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. 
+20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Carter think Amelia thinks Isla thinks the peas is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb141ebc52498b37365c76b5f7cf301dd72e407b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. 
+34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Mila think Carter thinks Amelia thinks Isla thinks the peas is? +Answer: green_treasure_chest +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1c6ae2d28e59273acc1279307f960184a8626a7f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. 
+9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where is the green_pepper really? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5afdc9d098158e3dca326ff63d0f5cdea406e72f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. 
+22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Emma really think the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea07560bf6070c4f7aa100ad4fa00387f6f72f8a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. 
+31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Benjamin think Emma thinks the green_pepper is? +Answer: red_basket +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff09a78505c7374cbfe8da0378aba64311346b07 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. 
+5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Jackson think Benjamin thinks Emma thinks the green_pepper is? +Answer: red_basket +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. 
green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fe6ab93945afde9af0a39af9318a61849e5912b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. 
+19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Abigail think Jackson thinks Benjamin thinks Emma thinks the green_pepper is? +Answer: red_basket +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0aa7b505ceda97750965da02616a2832aedc787e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. 
+34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where is the peas really? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..73d368790e55e430909ab78bb8155259a6882f95 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. 
+10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Hannah really think the peas is? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..890456c1b23bd0b4a497eff07fc8d9b688d7c3b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. 
+29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Amelia think Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ffc46715b7a03dba2d9b9355fba26c541e49d28 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. 
+4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Jackson think Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ede25f3eb01821b9c8bd377b5f4e07ccc82c7375 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. 
+24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Abigail think Jackson thinks Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d092b8109f167f935e25da6626fe9673c6cbe6c9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. 
+34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where is the turnip really? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67f69fe231923281a1e6db64338617b71b161e7a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. 
+10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Hannah really think the turnip is? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..695f9bcfae9c07ea6d518236744d73db6f38d0ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. 
+29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Lily think Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..37d2a8e963cd4deddccd35247ad04211b044f168 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. 
+5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Noah think Lily thinks Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..91b21891ca390dc5990a569973095d23d1c235b1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. 
+24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Logan think Noah thinks Lily thinks Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2ca07c1dc53e575d3b4786d9ceef00939fea117 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where is the watermelon really? +Answer: red_bottle +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. 
blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..09bb54b1486cb688a42716af683745b8a31cd358 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. 
+17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Evelyn really think the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..321f94a23a3a414873ca36cfe609ebcf8e9fe0b7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. 
+31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Logan think Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1367f6dac580197d7951621a8701fec23d101bdb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. 
+7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Chloe think Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..201b7a91148aedcfb42c864e175232132f324ad5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. 
+22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..78ee1f0ff74a12f74c380d78c947402ec7387e98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. 
+37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where is the lemon really? +Answer: green_drawer +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6b609d5c2f64da323aefee975b85cf5d6188ae0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. 
+13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Aiden really think the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f47cfc7953e9cc7b79d5a65ac6c0a6714832ee5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. 
+34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Nathan think Aiden thinks the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cca87ac85cf0a3a695da52e4c2239bfd53485e91 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. 
+9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Jack think Nathan thinks Aiden thinks the lemon is? +Answer: green_drawer +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a8acfb3beec6d209a32d64114cb2b9a609ce7c6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. 
+30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Jack thinks Nathan thinks Aiden thinks the lemon is? +Answer: green_drawer +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4b45e2ff72a40750ed0d9edf07f0cf159232d69 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. 
+4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. 
green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..73967d76c0c384ad4d21ebf35c5032502bef3b53 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. 
+19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Isla really think the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c05b06224270d3d9c64eae9dbdab427d9d7e9284 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. 
+33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Elizabeth think Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7cd63e54b41082ce383ba88b4a487cdf2b609525 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. 
+6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail think Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..96423f3b705c1a7ae5a3901f6e67be691591fb7c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/No_Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. 
+21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Abigail thinks Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..53cafc83361a4f76c32b619bf374b0a531a124f1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..dfbd9668a3c032870ad517d793c3cd7403c20531 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does William really think the carrot is? +Answer: green_envelope +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. 
blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7ff3cdb909d9825f935cb5b24591859fca82fa4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. 
+Question: Where does Hannah think William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ca3e9f8adffc2a04812155195d9ced188227e7d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. 
+14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Jack think Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e45897fa3be64fdc7d752fa0a9b0e3c46c12c8cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. 
+7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Charlotte think Jack thinks Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..48d0399006f26d1ec476f740747c0f74e7f42244 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where is the potato really? +Answer: green_cupboard +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ab868c095e7446e94511a5225be1b0af1d29a33 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Carter really think the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..da78c9fe184f935e310bc58652905e9d1fec7131 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jacob think Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. 
green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..36acb3b67667393fe072629fc3ce46b52f296af7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. 
+Question: Where does Alexander think Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..25e3e788c76fd7578f28a89d3fb36470d0d6d447 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. 
+12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jackson think Alexander thinks Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..154fc68e1096420ab8bad180193f6bb819018c02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. 
+7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where is the pear really? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..21fa36f615c73a001e6cf986a9f921b68776f1b7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Sophia really think the pear is? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..24a3b1f7df082de969538f5e0e78ceee787de664 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Ava think Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e672ac454525e6cb674346598e75f99208da7e62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery think Ava thinks Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c0290fe598bc0a2538108644339bbfefb3afdbe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. 
green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f1f8c8936720c7b53ed581f2cfd9494c43d3428 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. 
+15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6796016080081437caab9958fed489e604a80a9b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. 
+11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Ava really think the tangerine is? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0700e19c12186178e6a1e5146575c78eaae15133 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. 
+5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Logan think Ava thinks the tangerine is? +Answer: green_box +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..261ee1ccac063a8574d7da3bb9e8511b798edcfd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Owen think Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b3cc1773bfda9d7507ea5077f4ab3c5aef538a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Elizabeth think Owen thinks Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a66688d275afdf7b3013a7a05bd6949ce6d8f7bb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where is the onion really? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c39871d576231f7992d914b352b10de2a657c0c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Owen really think the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. 
green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f270b1c1d8a798ea2048a05076b7c5690c4a5ab1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. 
+17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Elizabeth think Owen thinks the onion is? +Answer: green_bucket +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fae656868c9ea807ceb80b339cc6450491e8e9b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. 
+12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Liam think Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ec00b46b4af19337027274f0c8bb4b632d42ad5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. 
+6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Noah think Liam thinks Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1388c9a81f5c75a42e3b60424be31993545e5538 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where is the tangerine really? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..091e3a8c2cc6ef346513fcf44af581ec277c1ff3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Mila really think the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..76b5814df0b68a8c5498285d28d5971c06a8bda4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Amelia think Mila thinks the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..60d3b14296843f4d7bd03e17809ab7ddb9ff8652 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. 
+Question: Where does Elizabeth think Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e200199964d1317533267db3aa1ba6f0c3753948 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. 
+12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Chloe think Elizabeth thinks Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1818df801d1b313e9f33a3ad383a9939e531d426 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. 
+4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..711c3e99a9cee1301de1f49298acdaf89c765b87 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Amelia really think the tangerine is? +Answer: green_bottle +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e5e10fe7eb75c0ab8932a04b545522653198e98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Ava think Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b977bc8677e50643b55f409dfc922a151875486 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b46eaff9fc67013009badc0572ea4595b868126b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Abigail think Carter thinks Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. 
green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0daf6b8542ac94e9311e0eec375ed1df699fcf89 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where is the tomato really? +Answer: red_crate +Choices: A. 
red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca82964a3ccf390ac9677d19807907ac5df5fc0d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. 
+14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Jack really think the tomato is? +Answer: green_box +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..15af3bed72e06e40c8622e8f43149697b7d0d09f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. 
+10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Isla think Jack thinks the tomato is? +Answer: green_basket +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e55cb352446681bdb822351471693a4ec4bdc7e6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. 
+5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Carter think Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc1b36f2beef42b0fccc3b4abd21bea14fdd3762 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc4766f78622c60482daed8d7065af4cdcbf8d70 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where is the green_pepper really? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed1d3fd3ff55663bed5bb4c19d5c3b4611d0ce92 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Alexander really think the green_pepper is? +Answer: blue_crate +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c4b9bc12c769fcb26c886699a35e389b0f9625f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. 
+Question: Where does Evelyn think Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..03642eb8aa544150d3ab6cd67a420bb5ec4fec29 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. 
+11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..93a9c4b55b0f4b455afad4dd7575342d915734e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. 
+3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Abigail think Hannah thinks Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ebf87fab54dfcfce39c1b82ea99022f339d53a3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where is the cabbage really? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bb516a38458ad0eb375eaa86f7f6c536f6a2e54 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does William really think the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. 
blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..44eb47af9939aa12a21e8b9bbc01eafe9007a7c8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. 
+17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Nathan think William thinks the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..445523fd6bf7cf04d6ef4fcbd494e93d21c8f9a4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. 
+11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Aiden think Nathan thinks William thinks the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..63ac83513ffe572cee76cb2d003904275669a31a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. 
+2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +Answer: green_pantry +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1c8d915d099b5de5c9c47d9ee3811c905259782d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where is the green_pepper really? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d73137aab12f7c99f42eb9495e5af40f98ad4e5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Logan really think the green_pepper is? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..49d3cefedb485535cc58c426d067b07050c06aeb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Lily think Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. 
green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f12ed8f42f456a5a950619f414b11aa26803244 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. 
+Question: Where does Ella think Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5555e8c2025439459ee7de22867205894229c6fc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. 
+12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Elizabeth think Ella thinks Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..075c0eec67949da15a6e52c6f95a06a414a14c09 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. 
+6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where is the lemon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..263760ccdff26804b762d7b458282673230514ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Lily really think the lemon is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..31381d0ede670ddf1a91576ab2afca06586ec9bf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the lemon is? +Answer: blue_pantry +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..77009fab8b74daada3c2c889b6aaffe46558cca4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Liam think Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7669b07d6e152c7e406a9ae94f63da382445f822 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Noah think Liam thinks Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. 
blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6525db63ab108d6915b1fb5d52042771809bb53 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. 
+17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where is the peach really? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..061337b4d2f3dbbe86fb2ad06b000e8801de6df9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. 
+12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Avery really think the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4c2178ed400d0c6b74d68789c88648e9a48ad35 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. 
+6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Liam think Avery thinks the peach is? +Answer: red_bottle +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..05f87f468f23d411802db881f3cd2f0f4af3e4ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Benjamin think Liam thinks Avery thinks the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5143dec5d4a281c1c4b91ad75c0cc7be920300fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +Answer: red_basket +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1bc06ec6e45ef0a538c05e9a06ef5da7b5de56b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where is the onion really? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a49d86c42e865bbc9c3f6d2fa034ff619e445fc4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Lily really think the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. 
red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..29f8f9db410531102cf3d96085d63284b5b6f3ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the onion is? 
+Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a81c07a875b7e40fa55b5ea48f2d809d99b8997e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. 
+14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Emily think Avery thinks Lily thinks the onion is? +Answer: blue_pantry +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..99834f8ab0d49c2b8a154c53c8735a9e0b8951c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. 
+9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +Answer: blue_pantry +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9557c73c97ff271f87f70d9b19553d25b9c18c7c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. 
+2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..02384e0a637e1ff040ba4ae1df7cc1d56d81269c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Jackson really think the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4693236ee17fc64e259db52b1977c96970bc403c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Benjamin think Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. 
blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8724f4b1400383de5cfb175f38a97b53cafafc4d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. 
+12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Mila think Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d286ae8f4bfae45efa9737020648bb1393a62d66 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. 
+5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Abigail think Mila thinks Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e54802526dce951ad7707553f145f2317cbfe4b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where is the asparagus really? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..19ca2006bcb5d16bf0526deaa1aecc10dd36ab1b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Logan really think the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. 
red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9d21452280bd840054ac366a9678a8096b73201 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. 
+Question: Where does Sophia think Logan thinks the asparagus is? +Answer: red_crate +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6eca3d001fa0524013d5d91130c34a458544ef39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. 
+12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Elizabeth think Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..29555456c13b4da34c83945bf8164205a3ac799c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. 
+4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Hannah think Elizabeth thinks Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..405e1e0bf22619ba28fab2c6e70591323b0147b4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea8d9e84fae2fc058addcf0bbb1485378c0e9002 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does William really think the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3050846dfec765ed2f0c0c2afb99145fead11390 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Carter think William thinks the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. 
blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3efdc2042a09ba5e799331f69e3ceeda621e23ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. 
+Question: Where does Owen think Carter thinks William thinks the watermelon is? +Answer: green_envelope +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a6e006997adb9d04c273642d6108e96038fdc2d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. 
+13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Emma think Owen thinks Carter thinks William thinks the watermelon is? +Answer: green_envelope +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f31d3d6ac36c7d7f0f178f75171979d85e48e2b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. 
+6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where is the tomato really? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8152d7ffffc5daab69c143b1148ed4884f2b3c34 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Emma really think the tomato is? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..dcf2ec30f8553268195f260275efcc386032d375 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Liam think Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0044f4e3bb5a94d7fde189f5c54dca40b4daf6e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Hannah think Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. 
blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..da8aae7cfd26748d6601265e67508a8ba4cd2ce2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. 
+Question: Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..57963f922fa02541ed47ef2a7e4a20a4818091e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. 
+11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where is the lettuce really? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5fa83fea27e255aabfb13474f86ba242112bb819 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. 
+5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Isla really think the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..be72131d12dfeb02c1092ee267117c0a677711ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Benjamin think Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..867597c6f65547ca7f06e213954fe3967c2c4a74 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Sophia think Benjamin thinks Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a4ee90a248f23d116a035a179fbb9791a94393b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Emily think Sophia thinks Benjamin thinks Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. 
red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3c0316399089ccc4864eb51565bcc1caab26746 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where is the spinach really? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. 
green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aaf77b73d86a757684f31e1752707dee2eb85d2c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. 
+15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Abigail really think the spinach is? +Answer: red_container +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2cafe80555a95a84c5c5bf77f161d06bf457c3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. 
+9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Owen think Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e42a3d74dc7731741656bbac3f67dca8da203343 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. 
+3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Aiden think Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..55b59775c165c59bd835373b73f601f4d8bd6d98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Jack think Aiden thinks Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..858c9860e92fb17a9add37e715c5388b0d2e8721 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. 
+27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where is the persimmon really? +Answer: green_drawer +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb853f25e60995a6966feefe0176814e51ae838f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. 
+11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Owen really think the persimmon is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae1d61d457aad528e52df1253f40f8471588fb6c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Amelia think Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. 
blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4fd65b459fd937e092f5706e8613168443bb4b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. 
+19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Aiden think Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cf06a4ac5d466a8d9d6154dd989c4031a4e70e9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. 
+3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Ella think Aiden thinks Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f3475cb02a8d084aecb5ad83afc6942060b49163 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where is the persimmon really? +Answer: green_pantry +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. 
red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a8dcfa54498258b295cf696870c1729ce615e68f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. 
+16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Ava really think the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a8a439fbc786cc7c69d393f1dadf55bad88282f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. 
+2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Evelyn think Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..63511a3ff8a745e7486c12b9dbfe2026d9b13f8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Charlotte think Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. 
red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1a85ef9dbbb9b0e03396a3f4b2cc666880a3c41 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. 
+15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Benjamin think Charlotte thinks Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fba769616ab8c98e4b4e224c2c98f4e06683d273 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where is the grapes really? +Answer: blue_pantry +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f27c9ec6d930644ba9c07158838865c3f18aed68 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. 
+27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Benjamin really think the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..eec5fa2875ae0b8b28a9f3cbe856d3e6fd0fb1b1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. 
+9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Liam think Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..763c6c5cf9b96b00d57caa4aa5be75281029ada7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. 
red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d0599c26a443d0829f370614f0b4a851c718a79 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. 
+16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cd19e24a898e29af907e6ba4cc42bce476bab00 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. 
green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..da8f9a43306f313d685511c3a15c57f31b5e34c6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. 
+18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery really think the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3dfc668e87d11b03cc989d17abc65f1eebd256a9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. 
+4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Jackson think Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4063180d6cb219ad65079a502413232ccaa15814 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Isabella think Jackson thinks Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. 
blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef394690acc2097dde25fc8deeb079914dfc5565 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. 
+15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Nathan think Isabella thinks Jackson thinks Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5877bec0ef6b26e98c1f277b91bd9bbdb83bca3c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where is the watermelon really? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0640871b5b6f5c1bd96585ccc7c1340607886ec9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. 
+27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Jacob really think the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3433bccb0f8c6ef619c6ae1cbd12af48c942eb1f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. 
+10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Isla think Jacob thinks the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1576a8c95660e7f5018786b7cbc231c609a0f8a5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Logan think Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. 
green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e4f181735c4ad6c0aad2a33c37e33dae2398256 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. 
+16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Sophia think Logan thinks Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..452892aca5b3303b9371b2a9ebbbd5a630e635bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where is the pear really? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. 
blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..af67c2a82015482b71b124e8af44a363523c1604 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. 
+20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Nathan really think the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfd31fcdcffe0f3e687820f4a4398262b7754270 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. 
+3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Amelia think Nathan thinks the pear is? +Answer: green_bucket +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..53c08fc1468be44d3b99611e698d4e79fc72915f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Isabella think Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. 
green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5b635ed187795a17b731f7d949b17193c2d551b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. 
+16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Owen think Isabella thinks Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e3cea5462c4364f1a0dbeb749a8a0eb6e12a43a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where is the potato really? +Answer: blue_crate +Choices: A. blue_cupboard, B. green_bottle, C. 
green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f4305931e05ae9231d97f2a3d2dbd1bcbef6ce7a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. 
+17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Charlotte really think the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..78fdd2167287ba5ee729d0e6314bf4a65777da36 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Noah think Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. 
blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4f4a501771776982c78d19814425818eecbe04f5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. 
+16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Ava think Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..004962ded2b55350b1cfa431472d05fa166e6c46 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Nathan think Ava thinks Noah thinks Charlotte thinks the potato is? 
+Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c467668e4dd45fdbccd44f9ac44ab4b75aa2dfcf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. 
+14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where is the cucumber really? +Answer: red_basket +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8fe289f01f72fdb7f18d73a49f3b714230a325e5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Benjamin really think the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. 
red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e511dba86ad0f247d3e24d7f9efd74d72857aab9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Charlotte think Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3b548650e5b85d6c507fe80e54fe58ef4f6ec56 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Evelyn think Charlotte thinks Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. 
red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..49844db8e9a569e4b5bc4cdddab2505ae6133207 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Isla think Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a7c8088eab1d746d3cac9dad25d67cc6c6d319a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2fe7520a2d858f5a0a6291d40dccf7265c7bd5d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. 
+22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Owen really think the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..56bf3d55efaaf67ec851e7a66c73c90e32b0e830 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. 
+9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Ella think Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d9f615c622277eabb82ad251bca45dd7c10543a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Abigail think Ella thinks Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. 
blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b7b4066fc85e24c22cb61d4bdfbfd0b2d3bfe56 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. 
+20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Emma think Abigail thinks Ella thinks Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e799456d4ab595f53a58395b979bdf125305a281 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. 
+5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..82b2ec5d377b93838665200b64dab72e11b23cc3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Liam really think the sweet_potato is? +Answer: blue_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. 
red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea7fd809dbf11166c7937d69eb9a7c1fb85c2cfa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. 
+18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Hannah think Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..38ac4c9bedf59d89faff0ae3b89debf7874bf4d5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. 
+3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce5e58f60036e4e339e13e199fb7583d8c1cfe2e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. 
red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4dce15610af0dcacc22df3834ff3eca30efe0ebc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. 
+15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where is the carrot really? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba0003968a6e1d14b5ceecc048af84d341a9284e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Benjamin really think the carrot is? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6826a15d99e9ca133adaa8f96f22483ddbee8a15 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. 
+26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Noah think Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dde2212a1550bba5b15a4682ea399886d66a78bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. 
+11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Emily think Noah thinks Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..18b798a83a75102224d5b788d3ab599423d84b3a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Sophia think Emily thinks Noah thinks Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. 
blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e117a95c0c832fc2930f9128ee4470184c66a7fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. 
+19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where is the onion really? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ab9e75b73833a3bb3fd23e1c814fdc2c9cadbf1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. 
+4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Owen really think the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..04e8794cb755d178ec1ce3782751a666c2326adb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Emily think Owen thinks the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ce7e8736c2adcf6644ba2ac720e2772f6e52006 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. 
+22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Isabella think Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a846b37c368d94be43410476c7e482ddfc0b5cd5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. 
+6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..85fd5920cd272c57979b7872468fe91be590eac5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f9ad8643f628ec873acfd66e255da41034c9ca2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. 
+23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Jacob really think the melon is? +Answer: green_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..18fe6ecdd5154b883bbd6f39ba4492fef7437b9f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. 
+9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Lily think Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d16ad46a2bbcc7c1433c702b10a7189c99346f96 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Evelyn think Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. 
blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..32117c96839104618c3d310126a8b5d2349e4423 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. 
+21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Ava think Evelyn thinks Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1849b6f393ad3045d1fb93b6ce93686d36f2c1fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. 
+5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where is the peas really? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e35274b2021d03ce26be88a0b1661aeae7f39eab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Emma really think the peas is? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f69ffd6c593277ccfd91c746160497aef7f48246 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. 
+21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Hannah think Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..589e63db98c1d845a31ce8951468b138e9837f5a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. 
+5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Chloe think Hannah thinks Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a82d2196686cbe654f3ae186c4d33001bb0bc9e6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Logan think Chloe thinks Hannah thinks Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. 
blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a15ce619ac9be4eb171b4bcddde3b464cc3755d5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. 
+20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc6e24ba02e7dc878d49b3606d0b6931792f379d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. 
+5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Nathan really think the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2219b54005bef09b096fa0d1706dd2bfef54dcd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does William think Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. 
red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5411229ccb818d9b63e30264dba41580da88aaaf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. 
+21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Ava think William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b10c3aad29166ce966f1dce1751d8b2c2722ded --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. 
+5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Emma think Ava thinks William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..862d8d0a03ccfcae5e44b45dd9dbb5b7d3ad84a9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. red_bottle, B. green_envelope, C. red_box, D. 
red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..901f102c0d8c4255d3d382b84167469d2cde3925 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. 
+16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Benjamin really think the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c8c3567285b28bad3fec501f1ae02e2750306ed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Emma think Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. 
green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..98c4447401bfdaac018165b4c9309a810be4edf9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. 
+16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Isabella think Emma thinks Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..73a118ec304304eb1141dc56c766bf5a8df849df --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Liam think Isabella thinks Emma thinks Benjamin thinks the watermelon is? 
+Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bc0f7513a82ea659ee2909981beca2439e3fbd56 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. 
+13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where is the peach really? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d8441d6fde0d600c47f55f58e4668377b5232ee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Chloe really think the peach is? +Answer: green_bathtub +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. 
green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..89129ac9734f65f59e9f43bba0c508b67648c6b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. 
+17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Isabella think Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..46f2e059b71be6e0a4caf103d7f3e97c656bc639 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. 
+2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Nathan think Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..87c0fb01b57e5721cf6b34d9445ddeb35b1f165a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. 
+Question: Where does William think Nathan thinks Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..09d0afc48313a06713acc0ce01fdf3e317a044cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. 
+13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where is the asparagus really? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f0a0c307b23659a87a02fd7a343e4aff96ce453 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Aiden really think the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. 
blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..81e494288818f62ddf23c49a59203f8b2fefbb12 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. 
+19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Emily think Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4e97ba84f68dcff7b3505de2790992cf98446c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. 
+2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Avery think Emily thinks Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad4ec058654eaffe4da81fd238d359eb63b065c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. 
+Question: Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c8dd3f0310cdd57731dd70d586ddd38912dd130 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. 
+11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where is the lettuce really? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..73e36e8b0d74370d02f84773780d410364ce2b7d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Isla really think the lettuce is? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. 
red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..489b026fbf5b425c9cf6e14eb1e8dc38d7c6bf18 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. 
+16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Charlotte think Isla thinks the lettuce is? +Answer: blue_bathtub +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cb9798244c5e2ae1c997e22265be23c27d53cd2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Amelia think Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6346795a8b1a2d799a969f6f48215996ceda4de3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. 
+25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Aiden think Amelia thinks Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad3cc17a4f5eccba1fb5ae68a18ef6b500b01714 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. 
+9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where is the apple really? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a447480788fbf841c48f2e5a440b4114e458d9a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Jack really think the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. 
red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..248c698d212bb0dccf101a6b117fcc8980323594 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. 
+21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Evelyn think Jack thinks the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..522e0d762bc9c0b352b1ea147df0dc93d93e4cfe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. 
+6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Ella think Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6da6acffdb31b6eb6bf39ae6e68367a14f05d8a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. 
green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9044aef8400dad68a8981fe35a899788d45aeaa5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. 
+18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where is the peas really? +Answer: green_bottle +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab570cc6bb7fbfee7441a10bb7846ddf6f347398 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. 
+30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jack really think the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec0908437ddc37629db608ef28d1c9edde70808c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. 
+Question: Where does Jackson think Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2206234a14b8c443d38f86aa03edc686a6824848 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. 
+13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Logan think Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a8bd8f5870547fefe858565da7f0bcfb3282b08 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. 
+26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Isabella think Logan thinks Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cf6f35e4c7831f36df7e773ea431688e44e68b5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. 
+34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where is the persimmon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1be06fd5af0498a0f2526796c472c80f16a21d3c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. 
+45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Mila really think the persimmon is? +Answer: green_bucket +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3f30627a9f6e20c9f944882dfc1ea668beba100c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. 
+13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Emily think Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..75106b41522aa5e4b0dc118cdc089bb86c72b5f0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. 
+22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Charlotte think Emily thinks Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8f79628e25d25627e2b9a34b621cdad95700346 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. 
+31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Benjamin think Charlotte thinks Emily thinks Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b2cf9963c9f80c2148949bac2d4f11b5aca8dd6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. 
+30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where is the spinach really? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..19efa7b8d24afd269722a572f58b251eaec180e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. 
+2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Abigail really think the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. 
red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7037ddfdb5d9f557b1e6255af16e2ffa9698e3a0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. 
+14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Benjamin think Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..53cf8d4dc891909e06a29718297f4935c025b1b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. 
+25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Jack think Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a48878218fd48259cfe585a204fba8ee6bcb5d68 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. 
+30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..41644fc5e834aa4723ec741941b84da81237ce48 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. 
+Question: Where is the spinach really? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7dfc93a234a68f7986cbfccf27b6a7d120780c41 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. 
+13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Avery really think the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa667e43abb8be4ad1f8f3190c74fd7c4faf56de --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. 
+21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Hannah think Avery thinks the spinach is? +Answer: red_crate +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe1da5de3e75e38c5013832f5213d7a3f5f42ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. 
+32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Isabella think Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6ddf29ad3bd5830aff3e8f0f1874a4ed16a25ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. 
+Question: Where does Nathan think Isabella thinks Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b9799e0c3b50386d7d1059e82dde65f6a02da6b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. 
+11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where is the onion really? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac8e4e4095f8acbef39f83250a081a6e393ec71 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. 
+22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Mila really think the onion is? +Answer: red_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3f333d9e1e91c54974ff70c6192d633c2c87090e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. 
+31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Abigail think Mila thinks the onion is? +Answer: red_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b60d4685269f9b4a394cd2ebf3296fd5e43dfa8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. 
+2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Jack think Abigail thinks Mila thinks the onion is? 
+Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f8be0b670b54b2c35bb3dcce1577066fd1c7f3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. 
+13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Emily think Jack thinks Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f849150293984171e0f45fd42c4453657350bc5d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. 
+25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where is the carrot really? +Answer: green_crate +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..693c34aabf2e725283bb4353061dcdd62bb23f39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. 
+32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Abigail really think the carrot is? +Answer: red_drawer +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..01a02b150b69753556cd0813122e062e089fe720 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. 
+Question: Where does Nathan think Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..09f5b6843f096a6e39a90d42a08c5db0b0117978 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. 
+12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Avery think Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b06eb9feb580f92cb6f6aeb69897bed80acdd3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. 
+21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Isabella think Avery thinks Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f882923613a0835313bc855bda8a922fd9521cfc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. 
+32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where is the peach really? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cf2adc3c1320bcb6c2a01bf1d90d240cb93db90 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. 
+2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Abigail really think the peach is? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. 
green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb845625f5ab45579e53984bc7329726535c615d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. 
+15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Sophia think Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7807cb5325694c97e435eea99aa3521f5a4f40ac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. 
+26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Aiden think Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff92e80411c0778ba98c72b1d2c1f0241566886f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. 
+32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Isla think Aiden thinks Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..73cb19d17c347da550005e4e3a0474498765311d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where is the cherry really? 
+Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc51116040827680c647a5bfe4107fe8196b441e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. 
+14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Aiden really think the cherry is? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b705060770a9b3633b3466430d21c5c6f439162a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. 
+25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Noah think Aiden thinks the cherry is? +Answer: green_envelope +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..56c34d49cef5f43da8376ec96e548eb40a643d8d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. 
+32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Owen think Noah thinks Aiden thinks the cherry is? +Answer: blue_bucket +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75694530380d3819f47c137e259a3e1fbe56e36a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. 
+2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? 
+Answer: blue_bucket +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d956f8a4754c41ed89a7b1992d6203a27624ffa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. 
+14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where is the turnip really? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7091bb5e35f449748c72df4aa45665b6151af2b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. 
+26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does William really think the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..465115818a327cfa40a24f903a97cf28b3bbe342 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. 
+33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Benjamin think William thinks the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..57dd3523990ac4d9bdd42224e7b041a6b44f986c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. 
+3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Sophia think Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. 
blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3df33fc9a1f663e191d226881a5ce4fb0a18bcb4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. 
+16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Liam think Sophia thinks Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3d43066f7213a033bd41c6b82a4f7f375bd8c9e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. 
+25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where is the cabbage really? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d0bd869cf6bc69e0f035b9565bd5e9a288819ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. 
+30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Carter really think the cabbage is? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..427aed8b66dc5795d0e6e107a98ee697feeeb0b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. 
+3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Avery think Carter thinks the cabbage is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. 
red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4165c15654891e66d4ff0b5ade87e15615f6b9ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. 
+14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Aiden think Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9bc588b28f80dc1f9bba77e663961e27c3bfa6f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. 
+24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does William think Aiden thinks Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a1dcac1c0ca1ba948f54c1fbd705121baeaf259 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. 
+32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where is the cherry really? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e71737b282379d62bb979786ee4bbd2123131fa8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. 
+4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does William really think the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. 
red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f659c2847d1fa6968ee93139e1339a3093709f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. 
+18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Ava think William thinks the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6ff68c268c9ce778ceb6a7955eee58bd204f1dc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. 
+32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Logan think Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1067c911ccda93bf5439aece81489ec1f60f4f4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. 
+3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. 
blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7e126a6e254e8a3f04185480a0050b653ceb6a9c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. 
+17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where is the melon really? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d025ca4dbc2cd5a4bec2f358620a3fa4e15fe4b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. 
+30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Aiden really think the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..41db3f32d94302685e41898636bb732f62fe19b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. 
+Question: Where does Owen think Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..41d874b725301098256f3cc719174118069a4ac5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. 
+13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Ella think Owen thinks Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b7b79794c74a55a99982348a5cc04868e06ad8e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. 
+23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Evelyn think Ella thinks Owen thinks Aiden thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4c8d541e01238eba23923ca708413e834413324 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. 
+32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where is the turnip really? +Answer: red_envelope +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0fb191d8431448d18f2547179820c6dbc5acc54 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. 
+4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Owen really think the turnip is? +Answer: blue_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. 
green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..37f3b35a9c4ddb60dd84821950bee99142d482c2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. 
+18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Mila think Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..20b97b4d764b723728d8850e1db13ad70de0262e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. 
+32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Carter think Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..46939aff3f0a79b8d750dae1f97fe5b395ce4357 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. 
+3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Isla think Carter thinks Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. 
red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef311d94add03428065763d2cca94c087a9dc3b6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. 
+17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where is the spinach really? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..40802c01d29d7314a91e5a1bf8d5d729df892585 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. 
+31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jacob really think the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c6ef07fad9c98bbbf7310fba7aa7258b091a2fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. 
+2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jackson think Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. 
green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bcec76b5efc283b6d4a10c9a0d7187acc0f2310 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. 
+15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jack think Jackson thinks Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..314b28b6a2828eb884139cd76c37b8ea6a60e8e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. 
+29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Ella think Jack thinks Jackson thinks Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea2075c0bcd30195fd863069d724b95c12476d7d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. 
+33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..83b9aaee31e0e8ad48e77d5dc0730557bc64e05b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. 
+6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Amelia really think the corn is? +Answer: green_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. 
blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e605c909752d015bb62de9d24623ee1d8bcdc977 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. 
+20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Nathan think Amelia thinks the corn is? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..544e9bf063d55e795a464545b6e4c70c75a0108e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. 
+33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Lily think Nathan thinks Amelia thinks the corn is? +Answer: red_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7db11a2a907789770797b28ddffe3f5b1011560c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. 
+5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Alexander think Lily thinks Nathan thinks Amelia thinks the corn is? +Answer: red_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. 
blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2734a3917ec54359d6ea0c3a8a2468c084f2507 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. 
+18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where is the sweet_potato really? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1da93f2a00b67db3e7eaf892c8a043831d2c61b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. 
+29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Sophia really think the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c4e4fb71dc21b39e1862e04ac7beb9af344578ce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. 
+Question: Where does Jackson think Sophia thinks the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4acd0366147b215901a0af7cfaa66474fb1e2c81 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. 
+13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Avery think Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c72398d8cba8e51286467a08ebc3d51976ea9798 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. 
+21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Hannah think Avery thinks Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e9d8246bf40529668e25c28e050f2cd3aed17a0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. 
+32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where is the orange really? +Answer: blue_bucket +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b959f7ecef384d563d709df077cc87a81e2dd2b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. 
+43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Owen really think the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6bfffee885e86b32fae30064fe69860cdc77128 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. 
+12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Isabella think Owen thinks the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb235ff29d6b7368be0095192908cce9713d3a58 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. 
+20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Jacob think Isabella thinks Owen thinks the orange is? +Answer: blue_bottle +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4456a0a09fac3c137ee63a2f87791b244825a0fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. 
+29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Hannah think Jacob thinks Isabella thinks Owen thinks the orange is? +Answer: green_box +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..524c5610c68714f9189bc6f41fccb56708f986fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. 
+34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where is the lime really? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e615fba118fa1952e58988333df42c87d19777a8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. 
+5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Amelia really think the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. 
green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..19134a858e8eab03f79b2dd2ded0749ca9e1dfa6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. 
+19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Sophia think Amelia thinks the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..993242bf8305792b1dde8714210fa39d49c88026 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. 
+34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Chloe think Sophia thinks Amelia thinks the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8ed56a0a14cb2edfc8f680c376de64cde3e17c71 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. 
+3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Isabella think Chloe thinks Sophia thinks Amelia thinks the lime is? +Answer: blue_crate +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. 
blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..581514cb013d1a609dcac8989af0c69453dac0df --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. 
+19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where is the carrot really? +Answer: red_pantry +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d7bf17b9dfbd404a9d1c2311a090157edcc69fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. 
+29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Chloe really think the carrot is? +Answer: green_box +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..92500356751dc81c98ae31e789ecfcc240180649 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. 
+34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Amelia think Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..13ea568dfb6a387eff9c0da9d716290594caf3d4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. 
+2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Avery think Amelia thinks Chloe thinks the carrot is? 
+Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cffcd366bf7bbba35c6ffabb5f5702eb54c4fed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. 
+16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Sophia think Avery thinks Amelia thinks Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..50d12098c9b8e2e00f67e6c9e3e2b146ff931231 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. 
+21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..47c913d4a5edb366cd4063a69506e24239cf36e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. 
+32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Isla really think the watermelon is? +Answer: blue_cupboard +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f22c5f1113e3ece5f55394ba456e44c8fc99bd1b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. 
+3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Carter think Isla thinks the watermelon is? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. 
blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..da1d196880d291705b50a38ae6dfdb439dc3498a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. 
+15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Elizabeth think Carter thinks Isla thinks the watermelon is? +Answer: red_envelope +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a7e39eadfa95a70660fa11e9978ff5e44e0c0c3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. 
+26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Nathan think Elizabeth thinks Carter thinks Isla thinks the watermelon is? +Answer: blue_bottle +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3f043ebabe2f854c2cb96ec777fe4ab9c8ad24f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bb34f93fdff8b15862da83b0a542d06211aec89 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does William really think the carrot is? +Answer: green_envelope +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2eb5b3c46b11e21b158d39fb37642c30aa5c587f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Hannah think William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. 
blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cabe88dd8d270f42313894d791287a16f2f19c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. 
+17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Jack think Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f711b4bab49773e1e83866d274e9b8e9dc9da29 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. 
+10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Charlotte think Jack thinks Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd5e45f2475c310ef9b00d45fda45213074b3225 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. 
+2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where is the potato really? +Answer: green_cupboard +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b3cb78a0a24a7a81117c16aa2531c95193568b6f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Carter really think the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bd8553aa766144060b47594a79be68191b557e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jacob think Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a9d0f9270a51954ade2cfb75c0c35b8c0d2cb3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Alexander think Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. 
green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..226ecca2dda1f12e3a323d8b7e64fc8508e964a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. 
+Question: Where does Jackson think Alexander thinks Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..952b2e18173a697607a2dc2b631573973dba121a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. 
+13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where is the pear really? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf30a6402ff86513e79584bd5ce149de686c9070 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. 
+9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Sophia really think the pear is? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4fbd1613b47d8868338034b627cdea1ed5c11cd8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. 
+4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Ava think Sophia thinks the pear is? +Answer: blue_crate +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e237cd620b9d5eec6ce038365b858b8babbaeadb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery think Ava thinks Sophia thinks the pear is? +Answer: blue_crate +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..de52a67c8dac88951109fedce63548312f6c47fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? +Answer: blue_crate +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2385e9cd4b8b708cd18a096a58216f488c9318c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2ebf8b1ada253679adf0a099b35ca9a33adee5d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Ava really think the tangerine is? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. 
blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..97c2258cf9596c903f4233a62e74276cc5fcc498 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. 
+Question: Where does Logan think Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..03ecfeda4a2c39bddac96ce1298828fbf31b3da7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. 
+12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Owen think Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..afc2e64ae6123ab4625a4c1e9545e2a1337ccfb5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. 
+7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Elizabeth think Owen thinks Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a107ab14038071ad6abc836442c44311b73336c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where is the onion really? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c17c1f2065ea2d0b1f88e09ceeb239b64b477e46 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Owen really think the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7e4f2d6727ccff5638351556d30d4788e1c6325e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Elizabeth think Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7c238ad346a30f94d09d06c579cac23c15b864c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Liam think Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. 
blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..701c59836deaf4c517823d48c818ea6c3e7597c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. 
+Question: Where does Noah think Liam thinks Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a8ecc5b886403be84bd6f7bff3b3852a91f27805 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. 
+12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where is the tangerine really? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..42df25516771a0e4df2b012ed608cf7bf809fc9f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. 
+5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Mila really think the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f784df5024da7aaa0e34841146aae2f73725fbc0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Amelia think Mila thinks the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4e3f6330f4d321d221475798cf11b4a54de9cfa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Elizabeth think Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67d082a267ba974e7c5a808ad0fdcf5a68b270f8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Chloe think Elizabeth thinks Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..14db8fce2936a9e7de8fd3e22f8ead4bf6340ef1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. 
green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bb84de67b9e27f39bc192c911c996ebaed39634 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. 
+16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Amelia really think the tangerine is? +Answer: green_bottle +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..14260ae287cbbf0476bb0ea91ca92563061d35cf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. 
+12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Ava think Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a35e1f3abf3df9d760ef91f1a73daae8f2388a82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. 
+7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..85d4b31c225a08bd7fd0752e7fe1950a709a0259 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. 
+2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Abigail think Carter thinks Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1745cf1b3d0468811c31320577e7d54e3ba6b930 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where is the tomato really? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f55acb16bd3866cc2f9c08025f6a72089be50333 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Jack really think the tomato is? +Answer: green_box +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..535361a81ed239391129a4d945efa5a258c50e68 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Isla think Jack thinks the tomato is? +Answer: green_basket +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cf43da6bd87e04ed835854328efd7c447055130 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Carter think Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. 
blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc2ece1f1c54e42adc9a3915c7ab414c4a98b76d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. 
green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..02f4d5b78d0b8d4ca5382b1d4f482bbd6774f8c2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. 
+15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where is the green_pepper really? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bbf585b2b24f10f5be33565478dcc3519ac9b331 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. 
+9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Alexander really think the green_pepper is? +Answer: blue_crate +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bc1eb15a37df6978610ca29db2f7d834e90c9703 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. 
+3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Evelyn think Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..41f4bff6d7a275334408261136d0484a94491eea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_crate +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5968440a091c06c44ecc07396e87c33b5f285e40 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Abigail think Hannah thinks Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_crate +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..955868c4aa2907af3ed9a6cd7eecbc64df7ccc3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. 
+Question: Where is the cabbage really? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cc4e3b27b50c38322259abe40b26bf2c15f7d7a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. 
+13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does William really think the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..70cc0fba59839e146e2560b7d6a26458e138fb53 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. 
+6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Nathan think William thinks the cabbage is? +Answer: green_pantry +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..098867596118f526ef6ba999963b59fa1ee2aaa8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Aiden think Nathan thinks William thinks the cabbage is? +Answer: red_bucket +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c740ca4448211e491ac2e7cd3aa767da0751333 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +Answer: red_bucket +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. 
blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5daa53543219d660073586eafad9e2c0486397a7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where is the green_pepper really? 
+Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a74d35a521d3309ae1563886d36023fca21cd57c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. 
+14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Logan really think the green_pepper is? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4220ff9187a0c40a9b276c02da7c325ae78bb078 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. 
+10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Lily think Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..08dca328066f9b8b633c625ae462d23c8970c36f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. 
+5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Ella think Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b20fe3624c909ea02ee8a36d415b317c663296c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Elizabeth think Ella thinks Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c19a9610045a95546efa24d05ae95167524fc901 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where is the lemon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6adc5baa9dbe7cee98d49acd3b51da71fae7498 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Lily really think the lemon is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..36a5438bf2d2e7d5d2901a2d967c3f142b7b700e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. 
green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2b0e313a830679c1130f347f4dd84032b662c21 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. 
+Question: Where does Liam think Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..018d8e3b82b0912fa3a9d663f91dfbf67417053a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. 
+14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Noah think Liam thinks Avery thinks Lily thinks the lemon is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dad67d58c820dc04d07524e3d7682d6513b69f7e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. 
+8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where is the peach really? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..567f2d30b2828bc44122c5db103e1ea600f4165c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. 
+2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Avery really think the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e18b436738a236ac17f678f4aeaf51ec4b7d572b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Liam think Avery thinks the peach is? +Answer: red_bottle +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..219f1a4d304e5c95995d935cc1602846d147743c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Benjamin think Liam thinks Avery thinks the peach is? +Answer: red_basket +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a0ad6a744a70d4cfb799d3ad908c95987e6d471 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +Answer: red_basket +Choices: A. blue_bucket, B. 
blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3058f65ebfd451a38924ca522538b7b145397691 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. 
+15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where is the onion really? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e097b40397d68defda50b8ddc8b26699879f3db3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. 
+12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Lily really think the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7edbde33e1d995bfcf97f6a437b12a7fc4568fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. 
+9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d582dad3fadd3d92b93a911859e59633f8df86b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. 
+4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Emily think Avery thinks Lily thinks the onion is? +Answer: green_crate +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a4b4339a33ad34e7f8c91af2da0052d3a7bcb838 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +Answer: green_crate +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3828290eec24c8c5cd83c18f09e049c51057e579 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba7be809027c37c1373acfcf3f3b41bdd134c51e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Jackson really think the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. 
green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7523eaf40aa277dccaf78a1be78c396a6faa0d52 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. 
+15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Benjamin think Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..85411bd4b147390ff534b94a94c36e506315c63e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. 
+9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Mila think Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e11a19b9e86caa70d9445663139149204832042f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. 
+2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Abigail think Mila thinks Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aff696cfbf7098c3b9251170527e9bb3ddaa1e22 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where is the asparagus really? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e7aa4805ba8c62f130dbdb6c80f74d337d7eef4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Logan really think the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. 
red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b211668f7413be8cd8953302961924e44136612 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. 
+Question: Where does Sophia think Logan thinks the asparagus is? +Answer: red_crate +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bbd8cfbc2394369b6db07397267c18db60e238ac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. 
+12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Elizabeth think Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a913a46d45a74dc5fdf0bbda001c0978de8307a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. 
+5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Hannah think Elizabeth thinks Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f5050187596716ce3800410353d034fcb38c5d6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3f74243ac87faaf3bc2c2ee3f4be4ee7af27b4fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does William really think the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e39433f1e1382d5c9d3e99a98919b90886b56590 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Carter think William thinks the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. 
green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5edafc8151b0da56251e47fc7c22b9b7cac1312b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. 
+Question: Where does Owen think Carter thinks William thinks the watermelon is? +Answer: green_crate +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2638043bb0355d39264d9ad831c016d0f855b180 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. 
+14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Emma think Owen thinks Carter thinks William thinks the watermelon is? +Answer: green_crate +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..87e6747447969ed4c9c88655afc32cc54fcd4f7f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. 
+8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where is the tomato really? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d38bdcddd4b7125e2408168613be7cf95ed8bdd4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. 
+3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Emma really think the tomato is? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..99b0fc1761141465d6d1ef177b9e6a0c0ec4b29f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Liam think Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c8a01a99b52200f755d28e37df63f77c227f202 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Hannah think Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..16bb8702a200bd3c0d1c2490655ced175ef6c326 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. 
green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b652f760a0aea510dfc044e8e94f928f3e621db9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. 
+16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where is the lettuce really? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf0b7e7497fdb2b09d77c654a1843230480d2f42 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. 
+11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Isla really think the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f750caf8be7c61e71e7223da9ab0081cafe9d85 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. 
+5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Benjamin think Isla thinks the lettuce is? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..57340ad7fe7bddc9f1919f052d3ad2d5c2efd85e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Sophia think Benjamin thinks Isla thinks the lettuce is? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8eab80c3c70c9469980ded0c304b0f6920b22deb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Emily think Sophia thinks Benjamin thinks Isla thinks the lettuce is? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. 
red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a49755a8403cddc0aa28d294298e3b6821aec8f1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where is the spinach really? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. 
blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2d88c415c0d1c2c9713d9b44224acfecfeb22be --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. 
+16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Abigail really think the spinach is? +Answer: red_container +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f143a88d7c4733bbc38e0fce09b4af5a702f6f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. 
+12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Owen think Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7eb67397304f2d72b1bea7fbc3cab62250f860be --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. 
+7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Aiden think Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..033069e46a3a097933fdfb1f01e569ec9f4c1e85 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. 
+2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Jack think Aiden thinks Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..34174b7cb4aa5b66ea5c0db35bc2450ee242249c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where is the persimmon really? +Answer: green_drawer +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. 
red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b54a82ccefba259db575d46a9c061a77f7d699ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. 
+20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Owen really think the persimmon is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d54866a84bbe7eef03049253be38525e258490fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. 
+4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Amelia think Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab8106a9364a4db5dbe40fbb156408eb0554c8d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Aiden think Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. 
red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c62bb3088315ed4996e737507e8aae6d70662d23 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. 
+17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Ella think Aiden thinks Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1717dcbd3369347b0be5a8d6b854f3ad0732d5de --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where is the persimmon really? +Answer: green_pantry +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e751d92d94394e560d5480cee851772f57586b1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Ava really think the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. 
blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..524590c4226f239ea322f5c1d93fcf3be05eae15 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. 
+18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Evelyn think Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3217b27e553500664dda83e099fcfc59d9bfd896 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. 
+4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Charlotte think Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d77ad280d9ef43ac7664342228640f47f9fe7ca --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Benjamin think Charlotte thinks Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. 
blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b156e89c941601de3c62bf4c98e8ab3ce4a65ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. 
+20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where is the grapes really? +Answer: blue_pantry +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..71541d7306df86d0167a524961c4bb9c0a09c990 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. 
+3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Benjamin really think the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2e78c30d00adf4fda68e08c7e967baa79c376dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. 
+29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Liam think Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..41dca417e04d7158596d6666fcb98343be5b5605 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. 
+12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? +Answer: blue_pantry +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb25f8b04df820da62ec55489569c5f24be10910 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes is? +Answer: blue_pantry +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. 
blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..166e4bd29650e0c67a60c31cd0b2cc845579c8da --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. 
+16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf51325c5901031843d410f8cd68a95cbe5a0517 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. 
+2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery really think the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8548e97a569db44a2aa4771ca41886ab2cbf717 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Jackson think Avery thinks the spinach is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. 
blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe221ebaa132c268f92c15d3f4c8c34ef4070b09 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. 
+15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Isabella think Jackson thinks Avery thinks the spinach is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..74baa2be8dff8d5a6e7db473b4ac52c5a84adbb2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Nathan think Isabella thinks Jackson thinks Avery thinks the spinach is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d75280a0e7cf017d2a2b0243607d7f5562bb4359 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. 
+28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where is the watermelon really? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a8abe4a1f02bbeb5c0db79846c739a3a95551637 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. 
+12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Jacob really think the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2870b752df2d83c0fc3d22382b8e48a32a8dbe3c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Isla think Jacob thinks the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. 
red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..13f52dcc44b907abd09efd575fc2cc4c59e0667e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. 
+18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Logan think Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..35495b9b9fc9773f26200dc39919256c72e4b589 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Sophia think Logan thinks Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3eff30bfd5448b3308b6d9070317d2f96c716df --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. 
+Question: Where is the pear really? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..701f45c1e9dcdb85bb25394c85e487b159cf0efd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. 
+15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Nathan really think the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..26efa0e4685ac08700ba333944a72e82aa8c6448 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Amelia think Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. 
blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae074a40c8d25b2eeee9dc5bc71a35fad20caf6d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. 
+21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Isabella think Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b202d8d040a369570d1087b14bedb74cef8aa838 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. 
+4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Owen think Isabella thinks Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..efd72faf701182e02de8fe0d2afa8af04da8b481 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. 
+Question: Where is the potato really? +Answer: blue_crate +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..25fd723573345796a2e93f4100148dac5f68e681 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. 
+15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Charlotte really think the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..29042c7a397d666c68716f41ff85a4b80d196694 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Noah think Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. 
green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b1d7f4ed819ac9547609d2ea94b00ec709eaa46 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. 
+17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Ava think Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..130b97bc7f0f88a0c3964d282d1a1d74549a5f38 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Nathan think Ava thinks Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. 
blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..13121aa11c0fc217386f0b1bb4ee6067ba1fa63a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where is the cucumber really? +Answer: red_basket +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d13e49cb83fad64d899fefaed31de1695adb755 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Benjamin really think the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. 
blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..10fe089fb05d138895ad9f16ee91dc9d14b7be73 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. 
+16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Charlotte think Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..288ecc768a4186ca8890d5e55e56a2c65111f667 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Evelyn think Charlotte thinks Benjamin thinks the cucumber is? +Answer: green_crate +Choices: A. green_crate, B. red_basket, C. red_container, D. 
red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c890569cc6c3c504a384fc79a5171150b766c67b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Isla think Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is? +Answer: green_crate +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3def8a9d44d1cc6a31c6179ae8b06b262b2d805d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9fdfe164d4f0ecc23b62412182de006776b8b24 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. 
+22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Owen really think the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe585eed3f5f3fd1059d82b79fe07d48db1f8f31 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. 
+9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Ella think Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..144b9967186df48e501fb77ae44a167876140c9d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Abigail think Ella thinks Owen thinks the cherry is? +Answer: red_drawer +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..62cd414d206c0d2386ecb255bb8201c9bb93f62a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. 
+22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Emma think Abigail thinks Ella thinks Owen thinks the cherry is? +Answer: red_drawer +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d833839fdf98b4110233a8025ec9686d450d9b5d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. 
+7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a84328cb7acc27d0dbc2ffdd429b2644e5e424ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Liam really think the sweet_potato is? +Answer: blue_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. 
blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..260d1a8890fe4b6748c56b77f1d03e3c99bc5744 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. 
+20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Hannah think Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d34772c2fcf58f4521af1b51eb5b10fb6317d697 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. 
+6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad840801d89943b1c94902ffc90ceec840a6969e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. 
red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a913d2b0f4952740eae0ef8e5ebd2488bcaec1ee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. 
+19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where is the carrot really? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a442ab3e5baf541751c7802e4becdc713cd9bcb6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. 
+4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Benjamin really think the carrot is? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88a4fb182cc87168d8b2667b3db9735b2e6f5ef8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Noah think Benjamin thinks the carrot is? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. 
blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f22aacc55fe6f42bb4692c69aadd84e50b204e14 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. 
+17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Emily think Noah thinks Benjamin thinks the carrot is? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb44267faf9486ede114c7b9a835f869854f4ac6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Sophia think Emily thinks Noah thinks Benjamin thinks the carrot is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..859bec66a7d4d17ee4ec011e0f167804a65c219f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where is the onion really? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. 
blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f21d3493ae7103fc945225db5db313cfc0917b4c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. 
+18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Owen really think the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8538b3958d04a1ddf0aca01e1e2c32e3a6638d3e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. 
+3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Emily think Owen thinks the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e8474374c6089eb6a90194a09f5254780ceee78a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Isabella think Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. 
blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f6f4e82481c473bdfcf529fb1e118bbc9067c3d7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. 
+20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca495b961020f17be0167dd3d7aab8a0863042f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. 
+4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9bbc21cefb445300f577d07b86e3433c846f64be --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Jacob really think the melon is? +Answer: green_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..39b5f195b9e1f3858fcc777b15c4f76a9fabea37 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. 
+23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Lily think Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a188f47b887b9d229153b15f65577e6d6014f665 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. 
+9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Evelyn think Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..676b28fa7cfc85b0bfaa67760159b7c1982a39b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Ava think Evelyn thinks Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. 
blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b5da1fdca4ff6f02ecf001e153540431611a6b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. 
+22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where is the peas really? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0879ad99148e23480d5395c5e605e43f62acd30b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. 
+8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Emma really think the peas is? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e8113c99f9ed39a4e8b2809a49f2a036b068794 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Hannah think Emma thinks the peas is? +Answer: red_bottle +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ef68896d863c6842c2d38f81e476edb8f36793c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. 
+22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Chloe think Hannah thinks Emma thinks the peas is? +Answer: red_bottle +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..887c5f4fef7fa391d78847120fb0d717a2fa896a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. 
+7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Logan think Chloe thinks Hannah thinks Emma thinks the peas is? +Answer: red_bottle +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b8254e289a0ee9a2c9e7645bfe161aedb1535dbe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0471d90ef7f389fb34959227509f89e175a1b75e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. 
+23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Nathan really think the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b6c6528ceb5a36c18b74444040088b37adddf1c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. 
+9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does William think Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f319e4386da4428147452765af55b5d936ea2a0a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Ava think William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. 
red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..146da7f67e2656236461bbb3d58818d1b467c493 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. 
+21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Emma think Ava thinks William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4ec1180e798c28793ba75beec661fb2c38213b57 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. 
+6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e397106fea04a7aa61c189fe7511062b4ffe9cd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. 
+Question: Where does Benjamin really think the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5fbc60269b2eec828cb7a7435ad7fa6b8c39f18e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. 
+13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Emma think Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..90bdab10db989eb4cb51af2a1885b37fa6034ff9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Isabella think Emma thinks Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. 
red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d38685cff25a34b8707c899f581610e42afd42a3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. 
+16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Liam think Isabella thinks Emma thinks Benjamin thinks the watermelon is? +Answer: blue_bottle +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7737b25ea6f4f9ffd3276209db4c602dd1bf753 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where is the peach really? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. 
green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..402718a54ff715d4c007326c22b6fc2fe247932d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. 
+19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Chloe really think the peach is? +Answer: green_bathtub +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..32e2a23de0721dab91498d16ee1e802ec26353e5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. 
+5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Isabella think Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..092242651570017f015133dab705816208dff824 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Nathan think Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. 
green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cb74bfbb11101d9b728a806008c99bea222170b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. 
+18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does William think Nathan thinks Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..154881032345c0fed5bf35f2f1e99e4ce3f81545 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. 
+4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where is the asparagus really? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b226f6adaf4684333ac921f66c8a76cf21e6755 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Aiden really think the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. 
red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0c75768702b06d77ab8e0bfff40c417627291bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. 
+17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Emily think Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..54ee97bd908225a15963a35b38a37c29b93d61dc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Avery think Emily thinks Aiden thinks the asparagus is? +Answer: green_cupboard +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..da6d1c69773863860ebd9ba90ae84ffe81a0f6b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. 
+Question: Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? +Answer: green_cupboard +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe2dd6d66d56c0518c644fa8bc12b414dbff9f0e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. 
+12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where is the lettuce really? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..33e380bf1415cc1f5e6ee3e9bc2a4433e55925f3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Isla really think the lettuce is? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. 
blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b8dc4b2354b7ab676c0d159f2ed9962c351067ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. 
+18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Charlotte think Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf72b94256e6388980f3711060fabc66f38edfb7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. 
+2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Amelia think Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b0d5edfb5822e590238cc4307caf2d6f7760b5e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. 
+27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Aiden think Amelia thinks Charlotte thinks Isla thinks the lettuce is? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b84870ec124e3ec3fc5d0007c9418fdaacdefc36 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. 
+11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where is the apple really? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..530bde89e72e80cedebe707c92eda0254a628e20 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Jack really think the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. 
red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8755813b107d561134796afd89d04b51ab350a4f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. 
+21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Evelyn think Jack thinks the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f720461b55458003c7678d5c8207525da2d8b22 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. 
+7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Ella think Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..092dff2a3b787265b0bcdef4ec9a6ec6675a45e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. 
green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..214dc54b506484e14ab1ce0ad577fdb0216c5f46 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. 
+19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where is the peas really? +Answer: green_bottle +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..355bb7bf7b02d965c5efee3beb8e1dbbce43c5f7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. 
+34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jack really think the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1a3a23230e198397408eebe66f53a078dfb12f0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. 
+4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jackson think Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. 
green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1acf4fb700ade2539dae2c9057df03eacd6babbe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. 
+18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Logan think Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8fffcb13872fc61cd3609834d39261b252a5339c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. 
+31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Isabella think Logan thinks Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f4c430ae25f1aed94c11c674882130a1731ea63 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. 
+45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where is the persimmon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8699e13bb7634707dd44784de6033ccce6be526b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. 
+14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Mila really think the persimmon is? +Answer: green_bucket +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1286098b2dc6a597e6f877dfaefc0799d68bb7e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. 
+22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Emily think Mila thinks the persimmon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd9de1be36f860938afeecf6b110a6e2592d6c64 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. 
+32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Charlotte think Emily thinks Mila thinks the persimmon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b4e27fc88d71924dff7289c03035171283d89e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. 
+35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Benjamin think Charlotte thinks Emily thinks Mila thinks the persimmon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e80fe4eb4bb3d2ba17c8fef22f1cfc74d5bab114 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where is the spinach really? 
+Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b477f267d73a18d0a6306384afb1b83e1c1a92a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. 
+14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Abigail really think the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..281e4829d0b95da6d1f01d9e48bf669c98f2a37b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. 
+26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Benjamin think Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bc33f8662ec5f3a90995cc70f33516e7f288f00c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. 
+31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Jack think Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..221bdb1abf16b70819cc2c4777c2e545af418340 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. 
+3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. 
red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..895c459a8124182266d1ddadfeba1530f32638c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. 
+15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where is the spinach really? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d73963fe89410a985b693cfffa77ac87ff1c9316 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. 
+27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Avery really think the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4acd65113e81132d93776d96c105aebce45320be --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. 
+32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Hannah think Avery thinks the spinach is? +Answer: red_crate +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a9a9d6ef95f61adee2729a023b382bc012bfeaa0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. 
+2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Isabella think Hannah thinks Avery thinks the spinach is? 
+Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a60cfc2e4ac2da0e9f07eb07319ec85d7733afe7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. 
+14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Nathan think Isabella thinks Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c85083a28520eeca742e383780b2befd8f5661e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. 
+25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where is the onion really? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b083aba0e559837f3ddf79487ac37095a8a6ae31 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. 
+32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Mila really think the onion is? +Answer: red_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f0a1a279317cbf48fd66f76fbcd20bb8c25bdce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. 
+5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Abigail think Mila thinks the onion is? +Answer: blue_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. 
green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ffefd85597e70890f1370d2b918e1631eb0078e0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. 
+17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Jack think Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..841f0a63d09322e2e1662f2686d2ebe4aada1b9a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. 
+30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Emily think Jack thinks Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5bb1283b55eb054cc5f805dde9b69043df97ba8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where is the carrot really? 
+Answer: green_crate +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..38bea07f8548cdd7a2ac0c542e42f5058c5d662f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. 
+15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Abigail really think the carrot is? +Answer: red_drawer +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0e936be18e66ce4a95917bd98abadd021b5c3a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. 
+27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Nathan think Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a24f939340b4ef596765cda6449d64aed35299f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. 
+33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Avery think Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e293d76b226ca292cd46a23def765bd4c5cbf22e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. 
+4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Isabella think Avery thinks Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. 
blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e77ef7751751fe9b44c4477002cc30692bf49735 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. 
+15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where is the peach really? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cce7cd6d62a0a58f91d326ac29300d2739c4c58f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. 
+27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Abigail really think the peach is? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..507c57cb4966a9617a8c8db8af18eb9428970ef4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. 
+33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Sophia think Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef845223b7f22f5d6e9c29201923c07336d4f44e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. 
+4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Aiden think Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. 
green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9637149d0045fa402dc5929c65195a31b78c09ba --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. 
+16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Isla think Aiden thinks Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1296a2390bfd1fba40e644acfd6fcda1a196430a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. 
+28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where is the cherry really? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d270c121946314556bf27b897cbc8d58f51e1ab4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. 
+33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Aiden really think the cherry is? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a86450e4b4ecbc6d074c51c0a0e7c8395e45cf75 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. 
+5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Noah think Aiden thinks the cherry is? +Answer: green_envelope +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. 
blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..933730d3a47e382ef518fb333f28bafe932080a5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. 
+18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Owen think Noah thinks Aiden thinks the cherry is? +Answer: green_envelope +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..efa30f55a30d9d76a18e1c2eee49b99d57b921c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. 
+30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? +Answer: green_envelope +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..03b6e4ce5d9a4972d1b31b4303c296b79899cf9a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where is the turnip really? 
+Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d633ed366371f49b84ffc1ae39c3708c6b1a7400 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. 
+14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does William really think the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c09eb81ae5349a9848595c7276d39e1809670720 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. 
+27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Benjamin think William thinks the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..71e737bf90e101f3f928e6010849e66cd1aa47e0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. 
+33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Sophia think Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..36486b6ddd4c1ed1f9f56cf5d6f4223e2847bcaa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. 
+3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Liam think Sophia thinks Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. 
blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e801321afa4e3efb8703e242d89ae16a9e7355c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. 
+15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where is the cabbage really? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa595ecadb99d935e301dab3a04e41bdbdc1766d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. 
+27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Carter really think the cabbage is? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..89b7716e3185f79bfd86a1135471dacfbfb3c2fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. 
+Question: Where does Avery think Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a2421a526a4ec2899e982328d8bb73e34e4ef62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. 
+12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Aiden think Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..38f8b6d40e6900bb18ab36fc2b704e41ae7d91cd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. 
+21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does William think Aiden thinks Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa3db8a52bf5b407bb7f1a866a50b872fca3089d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. 
+33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where is the cherry really? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..26f236b8a7a1e31e7b65c73f97c129a906ba1196 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. 
+5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does William really think the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..efa819448649361a77ddc03b102c6bef329c5034 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. 
+19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Ava think William thinks the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..697be74cc526dd1994720fc2de23a4a34220f199 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. 
+33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Logan think Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..22be522449bf2a67fa20de8d8b1ba47ec2fa78de --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. 
+5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. 
red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..32dfec1e617a51ab5b466f38b1a6d13a7ab63bcc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. 
+19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where is the melon really? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..88026e9662903a80c1fa01ad8be631fc7a762a49 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. 
+34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Aiden really think the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f67c194a3b259e0d69fa10580db1418d6263f66e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. 
+5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Owen think Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. 
red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..69019037b36b8af38393519af2663b11dd46b754 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. 
+18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Ella think Owen thinks Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0001203505c06e9d0d80d3cbbc412afe274dfb2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. 
+31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Evelyn think Ella thinks Owen thinks Aiden thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bff8392087d6183dacdead1ab7a1680f59d2fff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where is the turnip really? +Answer: red_envelope +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. 
red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..badccc476b409c47179e4b905ec4eb39a69e3c6d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. 
+15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Owen really think the turnip is? +Answer: blue_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..519655732300c5a68f85e4c7a0d119072e3aa8e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. 
+30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Mila think Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a864e5b072811a654c219f0bd1b7ab25d27dc7bb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. 
+2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Carter think Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. 
blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e3ba9dce43ec87e60c17c182794a181e4dea71c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. 
+16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Isla think Carter thinks Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..02669d864bd380e43ccdcdc6996f958537457a83 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. 
+31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where is the spinach really? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fdbf56a5053db977f88661b1faf3bfd20796187b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. 
+2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jacob really think the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. 
green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5d30ce4e5ce1c0bc7d9a27ca2001a3a9c85e545 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. 
+16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jackson think Jacob thinks the spinach is? +Answer: red_drawer +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0cc2689c87e4d46c7ccebbf57cc4fc2a27ad9df9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. 
+31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jack think Jackson thinks Jacob thinks the spinach is? +Answer: red_container +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a92e59bc2d5149d7b58cb9f3eb1eae2b2524596 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. 
+2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Ella think Jack thinks Jackson thinks Jacob thinks the spinach is? +Answer: red_container +Choices: A. 
green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..736db6a2a090db9b69aa4ca4d60fe907f2fea164 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. 
+16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..29b9d148c559f7b7925979a14018654445fa46cb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. 
+30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Amelia really think the corn is? +Answer: green_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..791a53e33ea96a9631a8e42b082c6b23df42f44d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. 
+2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Nathan think Amelia thinks the corn is? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. 
green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..56fdd5feaba14fe4a8b72154f4f290056c40dfd3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. 
+18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Lily think Nathan thinks Amelia thinks the corn is? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dde24a6592009efcc4edbb627d61f1236d75d7bb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. 
+30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Alexander think Lily thinks Nathan thinks Amelia thinks the corn is? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a72def29959a92153ad2bebca4ac3de06b9b606a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where is the sweet_potato really? 
+Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a22571cd34256e9dc6f14a027b76d8d9cb1aa471 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. 
+15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Sophia really think the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..28e9839e76884a4387542fa161ba5948c1c6640e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. 
+26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Jackson think Sophia thinks the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1aefc5a4a2b417e28b3f8a678773885426ce11ce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. 
+33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Avery think Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5661b359316bf2e2b2aa82a8bf6d09fb6d33829 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. 
+3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Hannah think Avery thinks Jackson thinks Sophia thinks the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. 
blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1adbec1fb0b2ed0e41dcc959b9f1219ca142a4a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. 
+16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where is the orange really? +Answer: blue_bucket +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f4fb2f69aa9173032734853e5b462ebe5c9a837f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. 
+25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Owen really think the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..879276607de271afc9be5ccd766cc3a8b86d59c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. 
+32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Isabella think Owen thinks the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..19dbca3c2b8b8b4edd53851fe50a3af8beeea18f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. 
+43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Jacob think Isabella thinks Owen thinks the orange is? +Answer: green_box +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cd85f54ccb766d0ec2f7474ddce825d03ed8efa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. 
+12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Hannah think Jacob thinks Isabella thinks Owen thinks the orange is? +Answer: green_box +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e5454ba4ee95e2719a8ce89426c831d7a4a8236a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. 
+21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where is the lime really? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..99a74994fbfa509a5cf9894cab8919daf8a98cec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. 
+35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Amelia really think the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..eaac98535505d83adec76639638f6cac9d11061e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. 
+5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Sophia think Amelia thinks the lime is? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. 
green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..57019d69cdeb080822f5521fa00da7dde9b0e776 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. 
+20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Chloe think Sophia thinks Amelia thinks the lime is? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f194ea4eab504fbcdec065e28deb97be6c6c0abe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. 
+35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Isabella think Chloe thinks Sophia thinks Amelia thinks the lime is? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..199a6e72467219d7322dabcb83cf9ad35ea3a3f3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. 
+6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where is the carrot really? +Answer: red_pantry +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. 
green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a16efee214c538ba3b0eeae168525217b34863b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. 
+20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Chloe really think the carrot is? +Answer: green_box +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..66506950b5f53db5e895be7adeed43b17011177a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. 
+32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Amelia think Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b8916e61c713924b2475c8ae83b3763c3535858 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. 
+43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Avery think Amelia thinks Chloe thinks the carrot is? +Answer: red_pantry +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0436d9f9f6bdbe93d13d42de4e851d21e38187d3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. 
+13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Sophia think Avery thinks Amelia thinks Chloe thinks the carrot is? +Answer: red_pantry +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d950a4844758ff4b22ec3ff85de39ab009f84583 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. 
+19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a181dbeab1944f712261422fc85077638366a3a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. 
+33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Isla really think the watermelon is? +Answer: blue_cupboard +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d79226986ff6a3466940bf8ace9d23f426ee921 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. 
+4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Carter think Isla thinks the watermelon is? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. 
red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..287f68a710b95466370e5b53e74d188132e3e5b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. 
+17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Elizabeth think Carter thinks Isla thinks the watermelon is? +Answer: blue_bottle +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c81d48b9f838c90bee07d236ce3240e04d48938c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_data/Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. 
+29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Nathan think Elizabeth thinks Carter thinks Isla thinks the watermelon is? +Answer: blue_bottle +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1db200c8a362b9eb9b566581fae3fe6c289fab34 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where is the lettuce really? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..13ba0f91ba41323f807f0363f60ced4cd6a16407 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Avery really think the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..67b5d39341912b9a49e363dbd5a31e684acecf34 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Charlotte think Avery thinks the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..864e9f9ae7f3ed7510e7fae97686c42fff662a6e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Owen think Charlotte thinks Avery thinks the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. 
red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2cc1280cec987c7c7f609a213052b5c4af5b23fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. 
+16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Isabella think Owen thinks Charlotte thinks Avery thinks the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..08f915286f2084d6a2be75e4b9c558fb94e9d3a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. 
+11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where is the plum really? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5579db840a4a3eb0865cc0dd7b26eae8ebd209a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. 
+8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does William really think the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4397ff00f50ec5d0679515b1b1b613548f807832 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. 
+4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Nathan think William thinks the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5d50a0c536e4eb394e5d9dd1a6873a61f2503d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Evelyn think Nathan thinks William thinks the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc974e0cb107f7882aa975d4c08be2f289166279 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1c86abf5f5c5f975f8b94706f21294561734580 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where is the orange really? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ac205a72ec92be0b5636db992d3f2d6dcf70a939 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Ella really think the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..89fc6dbb52f1a40a204c8e56d2b5ab7f91666d8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Elizabeth think Ella thinks the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d92f512422a2e9b1716d3c5e26c479425391751 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Chloe think Elizabeth thinks Ella thinks the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. 
green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0160e56aa263f6a49c6a9f3233dfe14c48da1363 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. 
+Question: Where does Alexander think Chloe thinks Elizabeth thinks Ella thinks the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2146d28e9dd6773bd308b87450c4298a8dd1367 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. 
+13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where is the melon really? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..97d69a0224ca3747595fc1baf9cd2ed2df908c60 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. 
+12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does William really think the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1181944a7be2a3abb5f9c06e4b2d08d73e8e440 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. 
+10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Mila think William thinks the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..675565375008876e6c365fb98937f4403c77d713 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. 
+8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ella think Mila thinks William thinks the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..429ac58c46bf9a53e7f35bb6b2638f6203259e52 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. 
+7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ava think Ella thinks Mila thinks William thinks the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b020ace8aa69fb8ed18dbb854bd58c5376e43c43 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. 
+4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where is the cabbage really? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67413d393d8c64449b235751705c8f1955c2800a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. 
+2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Abigail really think the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d273a2e5f9c08a506f39186a9978f2f35c714cd0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..375f121b0b9eb56690d4bf54ed0044bf7e811ee3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe1aeb65dc3a7bd0915577d00cb0fe1cba6aea03 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Charlotte think Amelia thinks Nathan thinks Abigail thinks the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5feb1cc2d07a162f3455321885242cf70f8c8aa9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where is the lime really? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e28b6d48cbd488a8283b32ea973d287e9240fb62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail really think the lime is? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. 
green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..235efd152b8b415c68ce058e440c969e97ef5906 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Avery think Abigail thinks the lime is? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. 
red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ace5e637eda8e63200f35fd7610d214248d222a2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Jack think Avery thinks Abigail thinks the lime is? 
+Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..be9cdf8f8d1cd2e7e2a3257acdfa78dc9c1c09bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. 
+15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Jack thinks Avery thinks Abigail thinks the lime is? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..47f97145f874e66cc36f02b6ac99387b41ed67ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. 
+10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bbfe4788f54ab3798d800cd1c95354ce28e0fa8f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. 
+9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Avery really think the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b228536f7f8093412b781de453495b7b0004f64 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. 
+7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Owen think Avery thinks the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..96a480ec5a471c6679a3048ddce00d55ed36ac33 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. 
+5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Ella think Owen thinks Avery thinks the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..19eea08b58f61db40d1f8d24fc146d2bcdb37f68 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. 
+3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Amelia think Ella thinks Owen thinks Avery thinks the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..090df54a26d96afb8789d7a8096d192f17b50e9d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where is the carrot really? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4803e6fc9066b043b80562ddfa9db19f2cee5cb7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does William really think the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..38e821fc13138ccc1d15c83db8ebbb04629147ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Evelyn think William thinks the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..421d14e44b2ffa43e0a5e53ac0d7b6091660730e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Logan think Evelyn thinks William thinks the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c80519eea5a2d7657bd689fc2bf5cc0edbd9a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Alexander think Logan thinks Evelyn thinks William thinks the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. 
green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f3572508d621958b8b014b03ce59d8a3f50bb97 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where is the lettuce really? +Choices: A. red_box, B. 
green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c85819f82a565a77f8f37a180ecd9680a6113ac9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. 
+15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Liam really think the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e3a68a197e0a86305b0769ea93de24e03b1fac5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. 
+12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Emma think Liam thinks the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..55bd7deb70cf94bc76570db56cc57c9056a4aa87 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. 
+9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Mila think Emma thinks Liam thinks the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e6e21ddde60ae1f7be30e79731086d26a5e1439 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. 
+5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Avery think Mila thinks Emma thinks Liam thinks the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..68f83462311635cd0f445139b91b2e3b7a2c01ee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where is the corn really? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa22cfd45bec23251223affbb5f87bf56bbb1f4a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Benjamin really think the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc1b5279b691acb958a0d0a271c1a2c6650b5002 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Jackson think Benjamin thinks the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..71a187ed2e21613dbffcc7a692f2a156057e6e59 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Liam think Jackson thinks Benjamin thinks the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c73031d39ed08a0c21c7b4216bd8159ddb162267 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Charlotte think Liam thinks Jackson thinks Benjamin thinks the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. 
green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e64c5923db84d1a29383d958e81dd8e774d70b87 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. 
+Question: Where is the asparagus really? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8fb3c7d652ce0e7a6bb51f8762cf0881d7ff2076 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. 
+11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Emily really think the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a34b6fe022e65b4fdc263aba601d27aca8b6355 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. 
+8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Hannah think Emily thinks the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c74ce01359b17aaa19ad367168aeb5eb83fe863 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. 
+5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Amelia think Hannah thinks Emily thinks the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..88f1f1c19bd98b89f3916c27b4ffb21be755b707 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..85cfdb0bbb59f3f694d686b6dd31fa0ed344bca9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where is the tomato really? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e49fb6c742bfa6247d3f72d0420e3a8ec7a09511 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Jacob really think the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f3292f9e68b5105f74b1ec88c733bea733f3a9ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Hannah think Jacob thinks the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5eefa4cfee0a0ba88455d8aecbe52f9d0fcb7ae3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Isabella think Hannah thinks Jacob thinks the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b29d8662753f76bf9a77665ca578557e2c59ecc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Elizabeth think Isabella thinks Hannah thinks Jacob thinks the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. 
green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ac244dc575610c58b06481f215f520fdf1521ecb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. 
blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b06e8a8c7f5afe5640cc571fb84adc6396fd5847 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Ava really think the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. 
red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1123c1a426c66e5a53b81234c00698ebc85ace55 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Jacob think Ava thinks the watermelon is? +Choices: A. blue_bathtub, B. 
blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..40d7e691d6787b87270aa151fb27b894a1e071d6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. 
+Question: Where does Emily think Jacob thinks Ava thinks the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d288bb999aa22a16f1047143b91e9397cd7deba3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. 
+12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5941daf9ca4b320099ae6e7e4607531ae465b4ac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. 
+11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where is the eggplant really? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a96274904710a309ea3d0cc9ac4e2500553d3290 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. 
+10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Noah really think the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c1bc6d648fe9ec00e28b6c609fefb3faf0ce3f32 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. 
+8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Hannah think Noah thinks the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..826a636525351614a7931d63a8127106ee052b02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. 
+6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Jack think Hannah thinks Noah thinks the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..25f3b1be1b4c71381f633c778bed4186e13219e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. 
+3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Owen think Jack thinks Hannah thinks Noah thinks the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fc59590d02e7d3b20daecf2c1da73a20cb948b1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. 
+2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where is the spinach really? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f822d56ea4c2e77e14224da72cc7ed72b250005 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Noah really think the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9601fc583e5a5ecea1cac825c0e838dce2289308 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Mila think Noah thinks the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf9340805361110e5c8a60071d83f6d3a8232406 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Emily think Mila thinks Noah thinks the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a042d3fb03d58ea41930b802f376eabd15c5dfdf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. 
green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dff9b9b42b35b0cb7c65795fb65de724d1912a0d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where is the potato really? 
+Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d617fefaa5a2edf2a91fa94c8fa3313c1b3d0d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. 
+14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Logan really think the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0cb890d9a93abcd6c666443a901f340c37c534d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. 
+11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Benjamin think Logan thinks the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..77bf78b4c8dd8b20f428d568e87d48dcca9f40b1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. 
+8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Charlotte think Benjamin thinks Logan thinks the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a161f499d195f77ace3e77406012785fabbea5a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. 
+4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b098b61e9daef2fef67792eda3c3a6642d50604 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where is the apple really? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..561272f8d0d83a4a886dd284f424da91f59987a2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Lily really think the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..63c9c3903d8a8d1cc34c9463ec279e8b51752f13 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Hannah think Lily thinks the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b8509440f9155dd20a8a1c4b4daae4970abb45eb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Jack think Hannah thinks Lily thinks the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..68fc189a7101f19adb3293893d4279ae34b0a4f5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Aiden think Jack thinks Hannah thinks Lily thinks the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..45d0698a8390045bfae472fca484d0b284ecb2d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where is the spinach really? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5eb78ce2cae42d1ccfaedb6db0e1b61c06736ff4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Emma really think the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. 
red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3f878279e16409af31ed403e97e52f16528de1ed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Ella think Emma thinks the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. 
blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..991844b22f9251b1a40aa68dd57045a8993c0789 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Aiden think Ella thinks Emma thinks the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. 
green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..846825240a0268e183d02c9196303fadf976abe4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. 
+Question: Where does Benjamin think Aiden thinks Ella thinks Emma thinks the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b33bbf0ea2a7666bfbca1edff555915c74771b83 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. 
+12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where is the corn really? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..082a828b63321d31261ecca22302ea057501a0ee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. 
+10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Sophia really think the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7983e63a27ef0df459f8a645c4f31a6faa1cfc92 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. 
+7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Chloe think Sophia thinks the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..88925a5dc0f8199e5214310c0338b9e785496546 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. 
+4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Ella think Chloe thinks Sophia thinks the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..212a7e6a665fea8f8b326667cba69cf329858b8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Owen think Ella thinks Chloe thinks Sophia thinks the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3967a403f13772e48cf2ac301d872f426e6aed41 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where is the banana really? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc4799929b758271f40c8a6b7df311c171213124 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Abigail really think the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c88115faca629d9e22a4e05535df6a6734e7c929 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Ella think Abigail thinks the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4d41fdcf7c69e0ea19eb23e2060c6be15c771557 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Elizabeth think Ella thinks Abigail thinks the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. 
green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5e2a7e3ff61ccaf3f597deeca4f09e68d45ca1f5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Owen think Elizabeth thinks Ella thinks Abigail thinks the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. 
blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b764539c5d72c32267fa3ab9a7661e5c4c38d0fc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. 
+15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where is the cucumber really? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d370d22bed3cf570e56a2778ad445c17890c3bb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. 
+4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5fcb29f518e1abe8f9b0e8ad5f256d4aec23e99e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Ava think Evelyn thinks the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c12a1f4f9c106d5c4d5839f99c2d7dbfe774405 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. 
+20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Charlotte think Ava thinks Evelyn thinks the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4746e73c1056752d1b995f9bd22ed18d91f7560b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. 
+8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Jacob think Charlotte thinks Ava thinks Evelyn thinks the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..03936effdc928926dee3b4192d0cb810bcaeb2ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where is the orange really? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0669ebf07a3da9a64e75bb123a11e9dcc5e5ba7e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. 
+19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Hannah really think the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa2c9b7a3142030283a840ca4233cad4f9ad3e93 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. 
+7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Aiden think Hannah thinks the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba1ba75aebf899780b09954c3d6974483d11e23b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Jack think Aiden thinks Hannah thinks the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9428ba79e94696dcb6e8e87246fe7cf1b566116 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. 
+19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..77c6fa704af0c34f7f75e7168abe5d6d5bc38ce3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. 
+9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where is the cherry really? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..514e32890f2203a082fac860d94d21b559c02fe1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Avery really think the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1efd530dc4fb14c98f2a3f5ec92fb2eed48a3538 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. 
+23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Lily think Avery thinks the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..99c1a5415979703cb348deb174a030244fa25624 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. 
+12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Avery thinks the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..28dce70abf1427fa6388050c7a6e5254c539a364 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b492fe1761075395146d19cd29571e0919bfc94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where is the pear really? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf8a2a9c5991015213ac149fda5bece1f1246b0a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. 
+20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Charlotte really think the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1587d5781c960cb45fdeb4897f4cde11ae7d9d19 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. 
+8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Alexander think Charlotte thinks the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a192fbc22dafc99dc600e1fb7537afd3f607e3a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Ava think Alexander thinks Charlotte thinks the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ee04d7a4b2e55d0995aed37bcde0133c09ee5c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. 
+19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a6472e973367273180b612c071e53c767aa8eda --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. 
+6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..865202b785278d5ddb09fe01b8b590d3e2bec118 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Carter really think the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4d328bf13071b3bb821bc092c7db260135f84599 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. 
+20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Avery think Carter thinks the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0dd54ab991b224ca3db947e714d0ed6b1fae40e1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. 
+7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Isla think Avery thinks Carter thinks the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5d17205e54953b6edfa36c6577630461ad33f2f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..74c68f1cbedc171e51833fea3c75208cf8003507 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. 
+20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where is the lemon really? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..665e55c2bb717337b9a32afea69d45076772c574 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. 
+9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Isla really think the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c19043f325aede096d3965005040b51f982f85b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Sophia think Isla thinks the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f3199f2c04cae2e7a3b733f9af0909a1729d9136 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. 
+21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Evelyn think Sophia thinks Isla thinks the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cc40f0d981c94df4c0b8f0cf4c3be2035323c71 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. 
+9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b818122a668133ceb31a38e4cd29d9f2c9db57f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where is the corn really? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c7f51d5c7cdcdf69d48d5e62aa5845c5efbe89b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. 
+19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Abigail really think the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e16f25b7f68c621620bd7ed6a50645e9f13ce31c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. 
+5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Nathan think Abigail thinks the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7da92f8e8cf3614c23adb00d61455784208a3037 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Avery think Nathan thinks Abigail thinks the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. 
green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..235f0a2af06c4acae4c0de3ecadda17827cbdb91 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. 
+19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Hannah think Avery thinks Nathan thinks Abigail thinks the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7494e0fe6ba607a1227a460d9a88af55d97fac41 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. 
+4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where is the tangerine really? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc6868f70d95ccb7ee8e995448e4e8655d1372d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Benjamin really think the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d5b0542bb135710b80c016f732a3dd703a5b801 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. 
+22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Liam think Benjamin thinks the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2b0ea0f4102f3db3d49c78bfd6fc8b76ce6117a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. 
+9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Carter think Liam thinks Benjamin thinks the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7043a5c73653bc0bf905ccb7120f937bae7804f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Jackson think Carter thinks Liam thinks Benjamin thinks the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..383039818033f196f62ff42afeb88e9042a97e83 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. 
+21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where is the lime really? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0cfc0479b449d697fcf9f586611e1ece06863236 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. 
+8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Owen really think the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..402773194c0741a014fbb38e2ae1b84dd407273f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Emily think Owen thinks the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. 
green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1fad99d7ef383e4a22e9ea13ee8475fb2f2857f2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. 
+19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Lily think Emily thinks Owen thinks the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..889e9ded579d23a10ac6a6cc05ac0aa91b3d1d1f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. 
+6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e81ab652d7655dd24f381cd8e6346dc0125aa9db --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where is the corn really? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9342af4ee8b79e786576b930dabd9a410f7e9df2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. 
+20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Noah really think the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..aec247a1dd3e0aa3903dc378400506e165677856 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. 
+7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Lily think Noah thinks the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e09011888e1d94efb33bbb3d278c5a7a2c06d32 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Isla think Lily thinks Noah thinks the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7388051f516ac306d6cda677e62381ce998dac4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. 
+19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Mila think Isla thinks Lily thinks Noah thinks the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ed3f36134171a8d068b9cb7083c29df380e54ab --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. 
+6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where is the tomato really? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..72d13e22235167c688a5bcace8322963ec4a7136 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Jackson really think the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fbcc2ed9e5e2560c0b70dbb760aca184dfeff87 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. 
+20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Nathan think Jackson thinks the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..33ba6bdb40623828292ccf77f4adf1c897dfef0a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. 
+8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Amelia think Nathan thinks Jackson thinks the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..58110a14b7940072e8bf4567be6a91c71e5e7551 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3b16a07e3eae9eb5b7c35e6dc18a67c3247063d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. 
+22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where is the corn really? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d83340552b6ed2e64b6d460f41aff57566845a3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. 
+11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Amelia really think the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d731c69fc800147fbbd55b3018fd6725f875cb1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Lily think Amelia thinks the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e856d2f89e6405580c878aca7ffe864b33de9a3e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Sophia think Lily thinks Amelia thinks the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1188d3e939ab609f8d79500ca04b69863955182 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. 
+Question: Where does Liam think Sophia thinks Lily thinks Amelia thinks the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b89f8b95438a9fc571ff099329d893315539eb31 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. 
+13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where is the peas really? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b72a31af03c3506e4423c320a45324f890ff29c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. 
+2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Nathan really think the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb24f3915a18ae484d989a14163949e804e914c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..68a2317cd444e8f18cf99d2ccdeaa8ee2fc74ca6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. 
+23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Ella think Emily thinks Nathan thinks the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c0fa54e9a0e3b9c2d597c4e88165c5e3d70d155b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. 
+12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Evelyn think Ella thinks Emily thinks Nathan thinks the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb43b8fdad05dc55f4035c9d4314be5245cf95cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where is the peas really? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d78331f34877e0a78815af64a4baec1caa2ec75f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Benjamin really think the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..eda6e3f600f6171f989eb06eeea64574ade03ceb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. 
+Question: Where does Noah think Benjamin thinks the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..714a4b15cf4eb9b9317ac3169ca106fcc1d5c6e2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. 
+15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Liam think Noah thinks Benjamin thinks the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..623f2c73b7ef946cbad150dcb79ec21e3ed0909f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. 
+2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Avery think Liam thinks Noah thinks Benjamin thinks the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..166ec276ab19f7c2927e909a18177ae6f989f95e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where is the potato really? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a2dceff5e6a53da295610f19b0a49f0e588d229 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. 
+22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Isabella really think the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..54645618de9cef5e761553c09b929576f8dad86b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. 
+11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Chloe think Isabella thinks the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..30583f0b2ccb9b00f5e4531f1aab69542c1bca55 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Evelyn think Chloe thinks Isabella thinks the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b906ec3398632ebe89a7dbce37c680b33e6c901 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..923ceacf1d273a047f52a952d7b9dd2e192d628c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. 
+20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where is the cabbage really? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8bd3fb719950c6b2e5727924050f302bf8a0ebd2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. 
+8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..32f1aff2ba49184ce6db4878ddfb0ca6d4c318f8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Aiden think Avery thinks the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae2fc228502080e5dab44271c0199a34293f6a9e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. 
+18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Emma think Aiden thinks Avery thinks the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6b2f8125bd9026051899b828472d37cf394a13b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. 
+5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e21af9f1ace40b6786f854a154523eba93b78316 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where is the melon really? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..571264c8de01ddb7f183ca39cdad7591d30f58d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. 
+23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Owen really think the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..757cf526e08a84029612601457f5c87d821b96d3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. 
+11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Avery think Owen thinks the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..efeecfb70527f2ff09efbd1f2f9465a320c8197b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Benjamin think Avery thinks Owen thinks the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..94741231846bde3b012fd70996febd6bde9338d4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. 
+23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb3a59bc7462a48e2ac0a660c4df3dea33471914 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. 
+9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where is the melon really? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..00b4af3463ed81d25b5d750a9cebc0e045717dec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Nathan really think the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. 
green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3080ba34ed93db2226067435e54760dd3b615b94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. 
+19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Lily think Nathan thinks the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..08239f3f972759e1a96a2986149d0df0bc5ea994 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. 
+6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Isabella think Lily thinks Nathan thinks the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed5332b497ada7212a0b9af8b60a5851184ab9fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. 
green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1590f7586f958d856c8bf5103a71d818f9354e3b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. 
+20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a2aeeb857aae9088e92b3aa677b1ee0b7927924 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. 
+8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Noah really think the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d43423322d14c30b17822f57a230d45639017036 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Emma think Noah thinks the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7efdc631619603c9bdbea02e08c70cf18f420568 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. 
+24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Liam think Emma thinks Noah thinks the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6078f4c3d8421613c59f0fb57acf4a391cf5302c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. 
+12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Owen think Liam thinks Emma thinks Noah thinks the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b62a10e75f06016e63d95c1bdef6362361b0ae96 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where is the carrot really? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b7df2aa10db285c48cbdaf09964f83d7a8bef4d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Noah really think the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. 
green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7481d0c7adcc191c17b0b2edd429e9e22386ce4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. 
+21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Owen think Noah thinks the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..480b9c57cdf2ee86aed21d1d2dff550944b2f74b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. 
+5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Mila think Owen thinks Noah thinks the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..76f001352542272c81cca3ebaa27b54c093d0269 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bfc7e9588628ebc33c34da26835a4fe178032d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. 
+19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where is the lettuce really? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d6792ead343d77317b62b881b37ae91992d8979 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. 
+32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Isabella really think the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f82df49fc2fb7047f2047d0f49f16e63b31877b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. 
+7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Abigail think Isabella thinks the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..493efde9b7be9b841f4d0a4945cc53ea64c665e2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. 
+25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks Isabella thinks the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c050d8fe88bd066de6b8e8c120e0b27c3064bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Logan think Nathan thinks Abigail thinks Isabella thinks the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. 
blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2dcfdae109f70ae28fbab28f20f2cb99b5878b1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. 
+17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where is the sweet_potato really? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..74815fa6e50f64d05067a3c36e5615ef98ca44cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. 
+34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c4d613a642cdbecad3bbd97de8d6ffb2dc83cae --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. 
+9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Logan think Evelyn thinks the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a213dc933a1c29860bf8d8b83b9d36ef659faaae --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. 
+28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Charlotte think Logan thinks Evelyn thinks the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..39a08a66814c5e5a70c75d5b5b212f7ddf0111e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. 
+4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does William think Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..acd634bd064829b29618717e70bb6296021b4c10 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. 
+23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where is the melon really? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c350d577f1a6860e1e00e0b69de141a0db099b7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. 
+34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does William really think the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7692508846187b555587a9d0b4b0a71d89b93980 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. 
+10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Lily think William thinks the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8930315bd329d17268a9b9cb72325bf24af0d3c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. 
+28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Emma think Lily thinks William thinks the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4890c952beca0ec2ee0343225099676532157c51 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. 
+3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Isla think Emma thinks Lily thinks William thinks the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f422b23ffa8396c59975fe81dd8b54d845a67d54 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. 
+20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where is the beans really? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed7f6a3c9b645b87ff3d91909d1d3a0c554471c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. 
+32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Jack really think the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..02bffdb80b773ca8908bf529ce9a2438ebe51c3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. 
+9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Owen think Jack thinks the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b26af71f2cf4c49dec4bb239ad35a834a10ca4f3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. 
+27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Liam think Owen thinks Jack thinks the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..37b6c871cb459d7bc08003b7e4d1eec32ae242f5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. 
+4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Benjamin think Liam thinks Owen thinks Jack thinks the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e166c354b54bd813901574895cefdf0b0445823 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. 
+23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where is the corn really? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..53d8586b46b79e2c1c8183f57a9301a091c2f74b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. 
+35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does William really think the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d61540d1e01d47fdaedd4b261140e51d07d1fbf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. 
+11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emily think William thinks the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f577411beb9adca7f8adbc98a1d16ad8c35d73b4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. 
+31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emma think Emily thinks William thinks the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8eedc91cc5189629ac4e6d6c2fadb70d991dc376 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. 
+7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks Emily thinks William thinks the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3627c0834c6443449867e62a25af75e2ae21e4c3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. 
+25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where is the cucumber really? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..db5be640e167c8bce176f873c374e94b6420c834 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4dc30037883a66f300bf007b54f5a03653323d62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. 
+20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Abigail think Avery thinks the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cccb47e8e1a683298893cd63ddcab288bca35956 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. 
+34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Hannah think Abigail thinks Avery thinks the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..52c5517baa88f0b752516fcc17df63e30214b1c3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. 
+8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Owen think Hannah thinks Abigail thinks Avery thinks the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5aa5c0540aac786528c3d3f933b206164553a019 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. 
+24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where is the sweet_potato really? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d36e5bf3eaa9031aa8f59694f5446b73e107423 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Jacob really think the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. 
blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d9f54fe35967dd15f00ef87311ba0b219eabc80 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. 
+16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Aiden think Jacob thinks the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..084187a0c59aae5ddaa9accc567026b747d6521b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. 
+31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Mila think Aiden thinks Jacob thinks the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a768e303dbac733584eb270c52bb6f55dfd920c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. 
+5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Elizabeth think Mila thinks Aiden thinks Jacob thinks the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..52a6b83e5e40101e7fe93b841af4860d8d253bf7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. 
+21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where is the persimmon really? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d6afd1a083a004cec944a2218eed8e185d3860c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does William really think the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..401fbbea3403ef86d6a50e6f107f8e28632f5fc2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. 
+20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Hannah think William thinks the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..005e4c500e695ea9ed2c398de15da51ac07b15c6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. 
+32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Avery think Hannah thinks William thinks the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3a60fb4481080bed558d672776f39fb2349b156 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. 
+10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Alexander think Avery thinks Hannah thinks William thinks the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9273fe549fbd46e5372b8b46dacdfd10e66c7ef1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. 
+32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where is the eggplant really? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c5733cf670fd62ac08ae2c82cd61e870ed31701 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. 
+10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emma really think the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3563f1bbaad32ad8f16ba47cd7a51f0b302783b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. 
+32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..371e392515a912e9ce92d439f0d4a0396b6ca1ae --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. 
+9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jack think Jackson thinks Emma thinks the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..63d78575305c93cb5930f7e43551d974a0293f3a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. 
+32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emily think Jack thinks Jackson thinks Emma thinks the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc06c7c7bff4fc2cd7154e68642048e237b3f6c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. 
+9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where is the lime really? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d9de3dcac45dd134757d821dc67f85e92fae90b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. 
+26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Elizabeth really think the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..72e1c9ff78edf8d3204e90f34ca6403e34fb0264 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Alexander think Elizabeth thinks the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. 
green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..142a4dc56fcc0ac5ba8cd1e3ec8633dabb8508cf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. 
+20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Owen think Alexander thinks Elizabeth thinks the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..39ef2f24f1b01408689a5f0d98401ad5a5e803c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. 
+33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Nathan think Owen thinks Alexander thinks Elizabeth thinks the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5099c05a079c30679dc36968b0f7785cec07560 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. 
+8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where is the pear really? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7ce6735a6dce8c565f0336c8c957b0865ca902a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. 
+30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Noah really think the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..377d05346ec9d582a3d2c7b2822a0e8191e35a57 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. 
+5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does William think Noah thinks the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c4d939966be474090ed3e15da5a3f80a5a307674 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. 
+27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Isabella think William thinks Noah thinks the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b69645142e071e5c5d14ba55203a9965ccf31074 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. 
+2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Aiden think Isabella thinks William thinks Noah thinks the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c26c27f5750b08b9f821a24e3d88b1bdbc6bef9a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. 
+23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where is the onion really? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..46b2bc97e524401a7132bcbea2da93532fcc4a60 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. 
+34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Nathan really think the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ddbabd526f62435da0188a14016b81fa356cd2d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. 
+8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fd0e0d94155ae0e308c72392583ead8561928ac8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. 
+27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Owen think Emily thinks Nathan thinks the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f35ee8f7eddebdaad849fe33ac4396f214ff49b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Owen thinks Emily thinks Nathan thinks the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. 
green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f1be658192b3b77e561733b16d9c6ab7e644545f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. 
+18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where is the spinach really? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..62e79d8af1b540320016a6e443d2f646ca4a4d9d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. 
+32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Evelyn really think the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a85ca221e93b62a4c37fb1a9f17acb5e1c0ee6ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. 
+4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Jackson think Evelyn thinks the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. 
green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1141a18fba8674ad9413722c15e586b1157a55d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. 
+19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Liam think Jackson thinks Evelyn thinks the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb5b017665cb170069bbfaff23439fd14d2f4a73 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. 
+32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Elizabeth think Liam thinks Jackson thinks Evelyn thinks the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..074523780fba12629dd3746c2741a213e2e00a00 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. 
+4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where is the peas really? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d164e7de34ea4376d73ca66d0357b3bbb78cbe3f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. 
+22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Isla really think the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..edf307577e1c776a33f2441a08dd161ce4b7a6f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. 
+33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Amelia think Isla thinks the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..86c9c72ca299768b6a1150d849ddf7fbad19f8ed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. 
+10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Carter think Amelia thinks Isla thinks the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1815a0fb68d42c2d348859fcb191e758c405cb61 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. 
+27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Mila think Carter thinks Amelia thinks Isla thinks the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..48346acc67b0cfe88468dbf3f8eb835f778527cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. 
+2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where is the green_pepper really? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. 
green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ffb67a8b0a60fb4389a8db2714bcb0c7197f7366 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. 
+17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Emma really think the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0119257d5409e82a415fffc7df037b9e50975a8f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. 
+31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Benjamin think Emma thinks the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2545b053f5627142f7c5f71ea83670e6f77bc165 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. 
+4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Jackson think Benjamin thinks Emma thinks the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. 
green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2f809068a5f512427cbeb34990a9187eb416b37 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. 
+18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Abigail think Jackson thinks Benjamin thinks Emma thinks the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..855843fcdb90d54342a87f4fe83ef0db9f84dc18 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. 
+34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where is the peas really? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea60459c5dd06e7d722cc374a0e38bff4f8bcbf4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. 
+10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Hannah really think the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb7bd40d7a738f113d7f2b353ecb3fd5104fec87 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. 
+30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Amelia think Hannah thinks the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c81cc8437c9fa9daa4be78c21de25c1b2fbf3b5a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. 
+5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Jackson think Amelia thinks Hannah thinks the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..77e9dffc35363f635488807bc9fe4abb1ca4d2e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. 
+23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Abigail think Jackson thinks Amelia thinks Hannah thinks the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3eaae8ec3bc17cecaad75690b4968d993622cc38 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. 
+34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where is the turnip really? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c25a2dd856ce66fe438d50686f5d7b8beeb13af2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. 
+10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Hannah really think the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f859adae6265c5167f6d9203ecc771d9a64b5480 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. 
+30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Lily think Hannah thinks the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..00267a12678fffc113535faf43dd09816f93f950 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. 
+5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Noah think Lily thinks Hannah thinks the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3754fd996c3a13ebde516f0433eb65423bebcf73 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. 
+23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Logan think Noah thinks Lily thinks Hannah thinks the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..704c684ba2a1a2c69f8dfdc01015c66bb039baa4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. 
+31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..56458fd896686a00f34d19776305ff543eedd518 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. 
+7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Evelyn really think the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3eb7e77da2e86334b136da95a93c5ff22570b8af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. 
+21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Logan think Evelyn thinks the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8493dd7ce4730d93a62156c4e33f4b98e2625abf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. 
+31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Chloe think Logan thinks Evelyn thinks the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..448a7f4a8094a631277471e9b430effb48eb6835 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. 
+7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0f4e8782a03c67834cf839b1b3e5186f58c6779 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. 
+24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where is the lemon really? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d39a09b140140f6d836e5d5300f929ba5f1c9672 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Aiden really think the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. 
green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f76d67d1c4dfe2cd79769c9e5b1299c7c88693d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. 
+21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Nathan think Aiden thinks the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..32d4b65c5e36b88e464b09c0a18306d7321b9707 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. 
+36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Jack think Nathan thinks Aiden thinks the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c7910b3680a54403c5f6b6516fb84926fd2b543 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. 
+10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Jack thinks Nathan thinks Aiden thinks the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..95da30c3ba9503c5f745bc2701be4d7fbffed0f2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. 
+26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where is the cabbage really? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa10913830f6007f0b76f6a3f83769f05588e8ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Isla really think the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. 
blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..40a4e913d075a07ab4085b522ebbb13e4c5beebe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. 
+16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Elizabeth think Isla thinks the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ffd60ebd236676632365e98569b7f7c1179f1d55 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. 
+29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail think Elizabeth thinks Isla thinks the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b43707a098e0161446a74ced5bd690c8e91be7bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. 
+2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Abigail thinks Elizabeth thinks Isla thinks the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. 
green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b88f5027fa70d1e963aa304322b1a0673ba84da --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where is the lettuce really? 
+Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..85a23ccae0a08a38a1379ec7fdb5562081cabb7f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. 
+14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Avery really think the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e4e83a77e00b6744ded2f781431387120cbf1c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. 
+10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Charlotte think Avery thinks the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1347f290d26b458674511d4f0fc14c0f2f58328 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. 
+5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Owen think Charlotte thinks Avery thinks the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f9f5c4faaa01982da16476d88d619649faeb4b5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Isabella think Owen thinks Charlotte thinks Avery thinks the lettuce is? +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d54cfbe38b78cea65188588297a863070f7e499 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where is the plum really? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..07a4d20b1412e20eb5a04c44529138e6a58ccab7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does William really think the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..523d050b40142b8c359a186e4e91927e43139a02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Nathan think William thinks the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b84e01dbb2cb02cd5d8692d19979b8b1a0bf249c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Evelyn think Nathan thinks William thinks the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..33d9e3ec7e4bf7975d291ad3a99de712118c517b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. 
red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c79dcce2e018b18bc0c8b801a72702b128a89fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where is the orange really? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. 
green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2aa53c0f27117aa271c137e0920e0407f320336 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Ella really think the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. 
blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6af0703824cc3afd746906042d98136c405a33c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. 
+Question: Where does Elizabeth think Ella thinks the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5bd137cc1f74471fa7faa0cf34de23b753f9f144 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. 
+14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Chloe think Elizabeth thinks Ella thinks the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cdcb8e10dd8f904d48ab7927315ec8fd2272a6d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. 
+10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Alexander think Chloe thinks Elizabeth thinks Ella thinks the orange is? +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cdcc578c6cdd464f80ecaf6299fc08ac4fd2d9bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. 
+7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where is the melon really? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..72eecc1977d05715f957d1800591edc64eddef35 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. 
+7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does William really think the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6ef62863205f43d0320cefbe68c36439bb297cb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. 
+6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Mila think William thinks the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f747666d39306651241c28ed4bb1f43a9eff3656 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. 
+5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ella think Mila thinks William thinks the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..642cacbd704df616b204181accf133b52cdb8631 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. 
+3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ava think Ella thinks Mila thinks William thinks the melon is? +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2818070a7959a1a983091108af4482d331cac580 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where is the cabbage really? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..673b2639407862b96ea031764c7a25a2332ef430 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Abigail really think the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b2435d9829339fbe127040566076b1b1a8e0ed9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d0e39585572b208635fbc5edef9573cabdda9234 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0e6f4c6d3a59fbe095c4ce3c52dd778d53abd16 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Charlotte think Amelia thinks Nathan thinks Abigail thinks the cabbage is? +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3848fb65623a3e51b0e2201ef41f37a2633cc99f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where is the lime really? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7fd6fc5945d49ad49f4640fb71b8d002e5c6836 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail really think the lime is? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b715e00ecbb6ba8b1738d69e3355ad746e6f982 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Avery think Abigail thinks the lime is? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. 
blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..34b143d03138e9e64605867354d9c8b9d9a9c698 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Jack think Avery thinks Abigail thinks the lime is? +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. 
blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5db1300502bb7f9bc60c3b26cc0aab9740c725a4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Jack thinks Avery thinks Abigail thinks the lime is? 
+Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..31712fe1b13b6a52e88a874b060a510b7ed70813 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. 
+Question: Where is the watermelon really? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8335b6fb3b3f873faeab9f8a62c538c1a393079d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. 
+13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Avery really think the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5df62cd250be1db48aeaa2aa5c7ab3c1a6b2d96d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. 
+11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Owen think Avery thinks the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5da27feb8cbd5cc59d20fa3ffce92a5eee85dee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. 
+9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Ella think Owen thinks Avery thinks the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cad19df70c7ccc97a3e643595dcc72de4624b9b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. 
+7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Amelia think Ella thinks Owen thinks Avery thinks the watermelon is? +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2635be5c9ca880655a616a0ca90a5b9ffafed578 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. 
+6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where is the carrot really? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa0a62c9153e33a261b12a5a02b29dacf7f3d9f4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. 
+3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does William really think the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b1fbf0adbcdfe9a3b40eb5eb7ad6e02a7eb0082 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Evelyn think William thinks the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2cafcf54935572e71abb1efe260fa379828f9243 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Logan think Evelyn thinks William thinks the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..71e618762aa78c9a4b2721f4bed972a74aaf9ff3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Alexander think Logan thinks Evelyn thinks William thinks the carrot is? +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf2656a3b002a410d373fd180c68fca8a080383a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where is the lettuce really? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..49054d03e8340e787abe7a06a353b073fa9c2800 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Liam really think the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d9e9ccf90f12daa41f5536a2c05499c53f5b0e65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Emma think Liam thinks the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. 
blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa3c0ba614fe4a50312033a8924430dafa72db8e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Mila think Emma thinks Liam thinks the lettuce is? +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. 
red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a516469e3b3b7252343b061aa49d5a091d7190a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Avery think Mila thinks Emma thinks Liam thinks the lettuce is? 
+Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d641f3275fb47598d427ec3ef9acbaae49fdf95 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. 
+14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where is the corn really? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..15a33880e3a52c8ec10ac0fc26b3b0bc694a1bd8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. 
+12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Benjamin really think the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a389567024cc274299fad785baa43dfa71344cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. 
+9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Jackson think Benjamin thinks the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..679d7c8fd3fe8a25fefe3f10c3b99115699deafb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. 
+6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Liam think Jackson thinks Benjamin thinks the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1adcf20889763819e1de05dbfb65fab69c4e4180 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. 
+3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Charlotte think Liam thinks Jackson thinks Benjamin thinks the corn is? +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc739ef01de69ce0112e17bafc6979ef92e1de5c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where is the asparagus really? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f216682e04484b4fdad31f9e5d1a6cdabaeba290 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Emily really think the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca234f757d5f4b7e346486cd112b2aa9e46bce43 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Hannah think Emily thinks the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2406c4bdda12a37f40018898cdd482b22bf0357 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Amelia think Hannah thinks Emily thinks the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b757551c8a4d94a8ec7183da44aefaea083ba1ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. 
green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..639fab284601a59a9df9ad8d9416b87bcc912a7e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where is the tomato really? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. 
blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3d05354de497d19a6abbc0c26140efe8b106fc6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Jacob really think the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. 
green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae6b0481b0164d5f20b2a84a3344238f98fa8f2c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. 
+Question: Where does Hannah think Jacob thinks the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae8f1062b0962de2b6b6de2f2cf1e4039a23a485 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. 
+13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Isabella think Hannah thinks Jacob thinks the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b2627cf463f5b3ad65266b49fd922a6455bce69 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. 
+11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Elizabeth think Isabella thinks Hannah thinks Jacob thinks the tomato is? +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..10657a43874b83587ea2680b86369fbd5ba6ff49 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. 
+9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..81e0b4ea632b8f28429e101bebdb58812dc7f717 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. 
+8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Ava really think the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7465a5c4da769f7e93059e528a52c462800a6544 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. 
+7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Jacob think Ava thinks the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b8bad48baf8483ac9769ea1173b9cf34d604d43 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. 
+5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Emily think Jacob thinks Ava thinks the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9355b42a75bd3b41c5213122c0584be833f22705 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1,19 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. 
+3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..046dd44c8bd521894b81d3fec82f773bcb9478db --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where is the eggplant really? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fae637e6a7c84140932326c5196e3e62655f0255 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Noah really think the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb0842aae515f3d6f0a9f00a8d02ecbe4f65ec6f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Hannah think Noah thinks the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfa5e9476aca8c362897971bca46369e80b1ef3b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Jack think Hannah thinks Noah thinks the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c78f9853aea7885f3a26d0704ac82f1c2784942 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Owen think Jack thinks Hannah thinks Noah thinks the eggplant is? +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1c570723683047bd4944755053345ae6e2ece19d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where is the spinach really? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..866ddac2b69fd6e314a8f0e3a70cbb6088629859 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Noah really think the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2596bcecf460dcff2a8a8d9e6b0c40faa2dc0b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Mila think Noah thinks the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. 
green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7851aaa6162d4f6a30212c4e3efed29b0de6bc1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. 
+Question: Where does Emily think Mila thinks Noah thinks the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a7ab9d8198e8b6d7e1c67608a389d887ec309d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. 
+13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b12cde8d5ebd2a30a1dbac5cc62705edfb2bc222 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. 
+9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where is the potato really? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c67c8a865e9faa0f9b7b33d89951591e5124181 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. 
+7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Logan really think the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ea993fc8f9cf3086934fe93c593290f0a257e8d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. 
+4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Benjamin think Logan thinks the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..203db88b3651a9f81e8496a4ca7742723d42df7d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Charlotte think Benjamin thinks Logan thinks the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..04c85bee4b083268472c7ce056fb0ebdc17ef6dd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d32bc772951365447bac4c47498a9125ce5a1d7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where is the apple really? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ed3ce2f0bb3a4eaf403c1c0bc6662e569d4384d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Lily really think the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..16019d92f88f6486a2ee04483b11c954064c0a12 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Hannah think Lily thinks the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a858f60a4d024c0ca3cbe1d01aea64339fa232d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Jack think Hannah thinks Lily thinks the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..720e255b2582fa29c953129c38347583b392088b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Aiden think Jack thinks Hannah thinks Lily thinks the apple is? +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. 
green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8af76b2776ae6a134d2e7701c1ecd31bab035052 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where is the spinach really? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. 
blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cd49da9e6a192d878b9f7b3c2bd6b28c7ad3d6c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Emma really think the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. 
green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..86dac1d70fe57facabc2d7041569a736b1cbe696 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Ella think Emma thinks the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. 
green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..44314a6090c0202f8fdb31946cb0b70f9e8b7503 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Aiden think Ella thinks Emma thinks the spinach is? +Choices: A. red_crate, B. 
red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0504be22e121cc08cffa1ab548ae501efa8186e4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. 
+Question: Where does Benjamin think Aiden thinks Ella thinks Emma thinks the spinach is? +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..41ea790bdd77260f956d1c2d7b1733d6f0d32670 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. 
+12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where is the corn really? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4449af84ad13d96f6cfe27f52686e9b945c075a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. 
+10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Sophia really think the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..40dfe562f2b479e92dddebf3ef5b9ebed1e672b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. 
+7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Chloe think Sophia thinks the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f75095364d60de3ddf0448e56803e69aab66f16b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. 
+5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Ella think Chloe thinks Sophia thinks the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..22d8c80b6769dff9f470741c7f6505b3dde22b18 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1,20 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. 
+3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Owen think Ella thinks Chloe thinks Sophia thinks the corn is? +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..af7af764bee2928060d974b4672473d9e1615caa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where is the banana really? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7950950d2555ef7f80aea6702d7a956569fe0f68 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Abigail really think the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f99dc93077346d0146aa1597acfb3fd9e657080a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Ella think Abigail thinks the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d22a7edce2043fd5e54f9abb7baf2b26435d1a0d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Elizabeth think Ella thinks Abigail thinks the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0a8b5d1832dbe5d04f078bafd682863efaf1865 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Owen think Elizabeth thinks Ella thinks Abigail thinks the banana is? +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. 
green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c1a51771283299ea8ad1c0f78c382922ecb9c020 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. 
+19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where is the cucumber really? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6857c0be9bb728827f895139e9ca78667df77f72 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. 
+9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e7641af22382efb3b3b48c3f3d1c42ca458d697 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Ava think Evelyn thinks the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5f213d33b86325b0e7677d786da8d4df0377fde --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. 
+20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Charlotte think Ava thinks Evelyn thinks the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..af6eb48c5bf6eb87cbbafae12664c0009e756030 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. 
+9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Jacob think Charlotte thinks Ava thinks Evelyn thinks the cucumber is? +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e1696e0abf97089373f661fa663d5049ce8aadd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where is the orange really? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa9d1a5814b09e9da27e68b2f0a02660d8a321c9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. 
+20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Hannah really think the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c566d6e62ee88b782136485f0a1b0b676cd8c88 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. 
+9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Aiden think Hannah thinks the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf4be321d769047c5e12e5df72e48169c2301da9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Jack think Aiden thinks Hannah thinks the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..17c451444950947445350a09a541678197d92dd9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. 
+20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7cd4e1a36cdc8854794472cc568921de1225aa0f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. 
+10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where is the cherry really? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..dcccf9bdb0d8fa6f820e5950a2abfd33eadea9df --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Avery really think the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..41066ceab111c454a8ac8e181b12cc2d97d2e724 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Lily think Avery thinks the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b83d5cd8b891232c51a565ea35e74e887a614894 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. 
+Question: Where does Ella think Lily thinks Avery thinks the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e5df1424f546ed090809bdadda1be07b5aa91d6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. 
+13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a99706b772f97ffda457b0af505c0b2372f30f64 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where is the pear really? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fd095c12bc348d09ec39fba1d87f72a439e8ea73 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Charlotte really think the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. 
red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a280326ab1c448556f6f7d0c8d269e4bc35e0ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. 
+19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Alexander think Charlotte thinks the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..04654c0ae0acd8086f2973c1d91b25e54d5c19e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. 
+7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Ava think Alexander thinks Charlotte thinks the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..853d7e7eab4291451b1be7b96f9199a994d179e0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb9c5e276b5615d0a0e7818654aeed9857c0e4b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. 
+21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e14714aa8cf00bbf65b9d2dadedf1a370bd063e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. 
+10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Carter really think the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..86013e14ec19c93c9d593fcf03646668e1e9d40f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Avery think Carter thinks the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f0c6433b68c02b111118dfeb8cf5ebf4901b1db --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. 
+21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Isla think Avery thinks Carter thinks the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4850e87aac348f6d8681d73ab15a5ed310adc8d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. 
+8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..441ac5006121d61ca0823512f27c7d5dc3f2548a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where is the lemon really? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d72212590b94ff872b4c15fe1299b2c8b357798 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. 
+23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Isla really think the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb6e4521e1c60736754d3333b6db568ea53d0aaa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. 
+13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Sophia think Isla thinks the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2000bdc9ea21872b6ee6346765f269e2950a4ea6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Evelyn think Sophia thinks Isla thinks the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..026ee898aaa7448addab7280f3c9ae716892f569 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf9cc9a1bac0e9c4e08a83a6afb6ca973258fed4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. 
+21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where is the corn really? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2792105bdf67ded278a45998c62f60589ddd7d34 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. 
+8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Abigail really think the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1165861109ac519bf8a6bcbf77952134b0bb609 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Nathan think Abigail thinks the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..192af91e593bf639cf9ca56a04f0a3a5781379a7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. 
+20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Avery think Nathan thinks Abigail thinks the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b77aaa2d83d0eadc9b1ace5b6106bac08b85e5e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. 
+6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Hannah think Avery thinks Nathan thinks Abigail thinks the corn is? +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..58fbc14211721333716284255059d07ed1e68d02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where is the tangerine really? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f82d07727cfa26927324cb7a50f48063ac215aa4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. 
+24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Benjamin really think the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..82e33875d69e2ea6bccfbae1751365c25e984559 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. 
+12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Liam think Benjamin thinks the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7755fc7d4e4e33bedc363acbb04c68642e9c21d6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Carter think Liam thinks Benjamin thinks the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..60747ea6c650bc539e2189346df8379b3078f9a4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Jackson think Carter thinks Liam thinks Benjamin thinks the tangerine is? +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. 
blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a8c02f8f3ef96a107e47c019597c78a44d05d633 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. 
+19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where is the lime really? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..01710f2bb31323180f2421485cc5d31d62634586 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. 
+7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Owen really think the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3afba99271020c79ef0472c01059f3142d851495 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Emily think Owen thinks the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ed848e984a9ec3c87bb04d94ca32bdb21929db4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. 
+21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Lily think Emily thinks Owen thinks the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f041b83bc85bef1f4fe6ccfb30c9d2b93226ce65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. 
+8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..150c173b24c7b0524095289ec2f5a8dabba60685 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where is the corn really? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a96cd07dd74f6ba07e803dc847b880417abb21fe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. 
+20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Noah really think the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..18ff8faab13dcd346bbbbe4eecbf629aae1c2d0b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. 
+8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Lily think Noah thinks the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c64614c4cfe40656ad61dbfda672b1f328b5203 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Isla think Lily thinks Noah thinks the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..303ad0c246723bfe4a3938f180f18f6325af5fb1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. 
+20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Mila think Isla thinks Lily thinks Noah thinks the corn is? +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..517df87778439918dc36ebaeee0d2b2e44846277 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. 
+7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where is the tomato really? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d69279b4ccb4e080b6c49bf1779eb7fb5202e8c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Jackson really think the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..618143953debf9ef280b38928d2d70c635c0f1cf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. 
+21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Nathan think Jackson thinks the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2279e2d076dcf79d53421831734057ca5b05ffbe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. 
+9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Amelia think Nathan thinks Jackson thinks the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..619e3e64b98742fc8cfa91ab36390c8142024136 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c58e86b66ce681eac4018481013e26b7a690ab27 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. 
+23 Liam, Lily and Carter entered the waiting_room. +Question: Where is the corn really? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b23be55aaf4c0c61854ffe460d0a7f849e2cbd7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. 
+13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Amelia really think the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4e67a398dd711008a81233d3c8fee6fdd3e50b7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. 
+3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Lily think Amelia thinks the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c1dca551bea18f4d6c68b6806066eb6b5280ecf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Sophia think Lily thinks Amelia thinks the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bc5bacf47c09a8e98e818ace45148a98ec04d6cd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. 
+Question: Where does Liam think Sophia thinks Lily thinks Amelia thinks the corn is? +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..124773d3303e5ef972eb30f20ae6758aec5c9295 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. 
+14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where is the peas really? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e5b88e645a7eb9f343100eefaccc63a273aa8b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. 
+3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Nathan really think the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c0c42023207a856d3596a54d2149d6831fa7a27 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bc545512d469d9f61ff5ee8e3aba5657c90cce2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. 
+23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Ella think Emily thinks Nathan thinks the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff743f3b6c2b6f08e76c281391a1be6e089e607f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. 
+13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Evelyn think Ella thinks Emily thinks Nathan thinks the peas is? +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3128e2c3dd08a90e7f9dde7db64d58b439e4bb4b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where is the peas really? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ed723df76ee0662de7e6896701fdb21d439ca4d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Benjamin really think the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce41e0f29976bb4a7dff06a1a1717659fb29691b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. 
+Question: Where does Noah think Benjamin thinks the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa7278116af4bef5d2cbc2be19107249f230465c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. 
+15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Liam think Noah thinks Benjamin thinks the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..45f4f4e4b1b900a47be81a1b32bb7292543d4603 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. 
+3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Avery think Liam thinks Noah thinks Benjamin thinks the peas is? +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbbdea38d54fc49efd15d2877b8225bc08d7e934 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where is the potato really? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bee2809aa125d591970eef4b6a738fc28e7f2d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. 
+Question: Where does Isabella really think the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..11033a49d0ea6ebd40996815fd58a93e26119b9e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. 
+13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Chloe think Isabella thinks the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..575a7aed98ca8b27989dba908d5f8ba07808a6c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. 
+3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Evelyn think Chloe thinks Isabella thinks the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ad180ace01306c5f54a9672a21e988f7c16e564 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3693d59439331166a312a1083861d26de5d8e792 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. 
+22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where is the cabbage really? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..788cac4e79eb04de46992ca055643d82890367ed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. 
+10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..68dcc180695dc737c1016c04467b65135b1952fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Aiden think Avery thinks the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..47c04a6f36cee6c34418df95dd05db2c4dcc7bdf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. 
+20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Emma think Aiden thinks Avery thinks the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8722f67337f5c3a21d634ee7bd9d4aaeace0f46f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. 
+8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e281136345c3808ebd5b74f681031d07dc2731e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where is the melon really? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f96a697a8d90808f823f979cfe7aa391d69735c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. 
+25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Owen really think the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f66962964503d767d1ff7cae491b7e500d5de36 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. 
+14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Avery think Owen thinks the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2edfef833de035378b54ac95f8c5b434e9e30cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Benjamin think Avery thinks Owen thinks the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a4bffef8c013553c469aa991964e088af5fbff4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. 
green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c29079f80db9a31c7a6fba5799da64476d184da --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. 
+20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where is the melon really? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..da33bb2a194f18d2270482a6be10e158076e9b79 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. 
+8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Nathan really think the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8850b0075968541a2ebe1d43c13a37d54d5c749c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Lily think Nathan thinks the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..31734361d5536d3363d6e3e1d836dbcc0cd8fa9c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. 
+22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Isabella think Lily thinks Nathan thinks the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..25888489504feb6f6ca6ab5daa90609beea05a4c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. 
+9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03b5dab24be773a151583df98721b8faf1eac2f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..30de6418fd6d980be9cc6f0088adcec3bfea86ac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. 
+24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Noah really think the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a84c73b0429de28b66ae2b91f8ac5fe33159ee75 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. 
+12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Emma think Noah thinks the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3aa78caa96551f4e30b3b23e3a1fd6c3d3b3592a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Liam think Emma thinks Noah thinks the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b5e1b820c8fdc294244ebf4ed65b9d69667fee0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Owen think Liam thinks Emma thinks Noah thinks the watermelon is? +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f84df285f54d3f2508f827f1bdfa5deb55c00865 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. 
+26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where is the carrot really? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c34618e0a10b01138e6da062168fabc9b6063212 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. 
+13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Noah really think the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b1b3de95924d04ac4194312c2169129b9a637a7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Owen think Noah thinks the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea1c11cf8ab0d2736f84d63ad3cbe545ab876829 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. 
+25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Mila think Owen thinks Noah thinks the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..807a108a606eb9a07ff4d859899092a422dbe667 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. 
+11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbee35d50e6ef42b5d5d0f25d800831ba4b87883 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. 
+33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where is the lettuce really? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b5c361b4f27ea9551c978f0a888c6f4ba4bbe65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. 
+9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Isabella really think the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..78d5b0ca38753f0f84025d567fe898ab88251287 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. 
+28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Abigail think Isabella thinks the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..eec3eb9702fcb51fae2cd7321f734597434ab734 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. 
+4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks Isabella thinks the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f85b808a66c2277cdd040ad33f66a1bb4d37e99b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. 
+22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Logan think Nathan thinks Abigail thinks Isabella thinks the lettuce is? +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e06b796697d8383f06fc95ca41705ad1834fe9b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. 
+34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where is the sweet_potato really? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..de55370ec649fbcf83d35ebffb05aca8274eab50 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. 
+10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ddcccbb5a1ad4353a35cd68a08543baa21c4b22 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. 
+30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Logan think Evelyn thinks the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..21103f762b8c23ffeb3b68da380cd8296da5a88e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. 
+6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Charlotte think Logan thinks Evelyn thinks the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..54ef7865cc3a5b105d7f55a0d04b869a5b742da7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. 
+23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does William think Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is? +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..826f515bd01bab276653db9ccd154520f1262b64 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. 
+34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where is the melon really? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..442de3e721e81202eef4db959c45d4b93ce272c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. 
+11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does William really think the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc388deff5f3261871bb884eeaf25087e7213b37 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. 
+32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Lily think William thinks the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b1b3781896e05fceb9b9abfdf26b01328a04a78 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. 
+7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Emma think Lily thinks William thinks the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..951cf33a4dedda6987a59aa6cf9409ab64d2318d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. 
+27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Isla think Emma thinks Lily thinks William thinks the melon is? +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9879512cac990fe24949441160ca673b354b7a02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. 
+2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where is the beans really? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1939ffbecdfa714963fc00a9faf998232f585f7c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. 
+22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Jack really think the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b46970278016a4a4c0e4196a023c4ab90c578056 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Owen think Jack thinks the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bcb8449db26721287707023d7e4f28de443b3269 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. 
+20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Liam think Owen thinks Jack thinks the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dba424bcc3e94fb583778eb3f0ae65761b11408f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. 
+33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Benjamin think Liam thinks Owen thinks Jack thinks the beans is? +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2407b0c4498455b30afac6304951be069104f369 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. 
+12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where is the corn really? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3172d7e11a3f3787040e33f5ee0dd40d1ac2e09 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. 
+32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does William really think the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4978a89b454afe0f71e483447b60c42bc943a3b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. 
+9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emily think William thinks the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9709fb23fc4e317905d3706f52001bab173f82e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. 
+29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emma think Emily thinks William thinks the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9eb7b2e3a88a2820545930a3020b283de8ac346 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. 
+6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks Emily thinks William thinks the corn is? +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9327964938beb381e02f5e131e7f34a5b6e79e99 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. 
+23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where is the cucumber really? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aad3825de6a118b093e1041d25dadce1fcae61c3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. 
green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..66799b97149ffb3498cf27f9c37501830588a292 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. 
+20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Abigail think Avery thinks the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0f9e8b78d7d88686728409d1177a778a6ce805e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. 
+34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Hannah think Abigail thinks Avery thinks the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b9274f8f1895ce7af8eade5769bed895b02c3c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. 
+9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Owen think Hannah thinks Abigail thinks Avery thinks the cucumber is? +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf5a68b2c63fdd38cb9b9836dd38e9fb17de3f65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. 
+25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where is the sweet_potato really? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6ddb5755ebeebab3101965d81e5cdffb7976a21 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. 
+2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Jacob really think the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c10abf22d695e53144f7ef1e877fedcb25a659a0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. 
+18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Aiden think Jacob thinks the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..31ac6ffaa21df3bd0021c5466944a61e61052785 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. 
+31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Mila think Aiden thinks Jacob thinks the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..066250c4336573d0f508f124e60eca42c7333246 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. 
+6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Elizabeth think Mila thinks Aiden thinks Jacob thinks the sweet_potato is? +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e50bb4e2f5379ae0b75161bf85ba6ced43c52315 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. 
+22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where is the persimmon really? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e5c0243a2190dfa41365c6a13243f2dae3ada3a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does William really think the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d007f9616b3c512ef94d0249d828e53aacc35cf3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. 
+20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Hannah think William thinks the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..87ad7613e53fc863759a4673cd7d80de46fa20d6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. 
+33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Avery think Hannah thinks William thinks the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..09f3b7905f33a2d48bb394a9ae124d6cdb769d8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. 
+11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Alexander think Avery thinks Hannah thinks William thinks the persimmon is? +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0bf429831395bcd116411b8d6bc747806ee83e5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. 
+33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where is the eggplant really? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..634b2c0890b722c563c79bcd4c2598e688a439b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. 
+11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emma really think the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8e6b20ed39c83c96266c7daf0c3fdd377e67330 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. 
+Question: Where does Jackson think Emma thinks the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2357d111a69c405c336aa69ea3541f194dfc8e43 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. 
+13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jack think Jackson thinks Emma thinks the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..379de7b33b9e76920e9b5a17bd4df9376e3a5edd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. 
+Question: Where does Emily think Jack thinks Jackson thinks Emma thinks the eggplant is? +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e85cc22217d2819e6238676acd54bb6f74351b8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. 
+14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where is the lime really? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6b1df5c22c014ba9a44b9715d428c7070e91f1d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. 
+30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Elizabeth really think the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0e4abc2370255466d8e034d8a3a172155be34df --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. 
+7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Alexander think Elizabeth thinks the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4adb6f3bb028c38bf54cf8888da61bd32a1b050a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. 
+23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Owen think Alexander thinks Elizabeth thinks the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a816203a0cffe282fb032274d3123622c7f7e892 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. 
+34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Nathan think Owen thinks Alexander thinks Elizabeth thinks the lime is? +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..be79647685e6d477af79e2cfeb57dbd0abc2d530 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. 
+10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where is the pear really? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..16e8c1c2ca4de276e7c17ea8c3023a4181bc98d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. 
+33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Noah really think the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..51402c5428d6808237d1803d8beeb3ec20c96756 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. 
+10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does William think Noah thinks the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..671e72d776729ec8c873741b145b4d7d8ec2ea78 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. 
+32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Isabella think William thinks Noah thinks the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9975223745a50d8b3233eeae0fe6a205eb78d48c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. 
+8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Aiden think Isabella thinks William thinks Noah thinks the pear is? +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a6fd1a4c80f9e1ba93f613e8a4fb0bfa96b48f4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. 
+28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where is the onion really? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..af53aa276eaa11d14e84e868f6f80b887fa7ec81 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. 
+3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Nathan really think the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e507776d514bb8c7cfb3a43c00f6867f8f78f49 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. 
+22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6097ead0c141dea1e098a777fcc6c10e6052d06a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. 
+35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Owen think Emily thinks Nathan thinks the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c9be002f0a5d1cfa246f770dd9c13522d49d2da --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. 
+9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Owen thinks Emily thinks Nathan thinks the onion is? +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad7867cd716cb4a2c2ac91c29753ec520bff2f36 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. 
+26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where is the spinach really? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5bfca84a2c52d1c92fde93c9a63717e92e4a75b3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. 
+33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Evelyn really think the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4ebc11cb0e5c5d674f82930333c115673eee883b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. 
+5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Jackson think Evelyn thinks the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8681643629a0343b6cf5c9208230cca744024e78 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. 
+21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Liam think Jackson thinks Evelyn thinks the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6221b45ab4ceea09cfe8b9efe04976e1ae20f8b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. 
+33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Elizabeth think Liam thinks Jackson thinks Evelyn thinks the spinach is? +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..35b167eda5cf93e0cb0fbce7d598761cc5d62448 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. 
+6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where is the peas really? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..be87c9454f6cf6d5da53dc818602e743bd127116 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. 
+26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Isla really think the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..02d25a2589ccb058811c96db7e316e7f4fd4569d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. 
+3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Amelia think Isla thinks the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f6ba443d5251b548fe38cfe9942077a2e9ca551 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. 
+23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Carter think Amelia thinks Isla thinks the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe3d6ef76c4bd480f1196f0e4b6bf1e26b24eb8e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Mila think Carter thinks Amelia thinks Isla thinks the peas is? +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. 
red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..831d90f8c22daf514931c5ec046db9d4b5dcee0e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. 
+18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where is the green_pepper really? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed4e25cdf4763f38ef9f4e29ff160e669b58e200 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. 
+31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Emma really think the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8fdd1ca4874ea24647970dad96cdf5e975a9d017 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. 
+6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Benjamin think Emma thinks the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b3abfb8206843e97a758bec8512341d7e40962e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. 
+20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Jackson think Benjamin thinks Emma thinks the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..940e6c0deb7367e054b8403485be41caefd14cf2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. 
+31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Abigail think Jackson thinks Benjamin thinks Emma thinks the green_pepper is? +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..908f81e3c4de452d3d2dece14d1a01e3af6a6d1b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. 
+5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where is the peas really? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e76bead7163e1e1b0bfc60d92ce5163fd2a142a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. 
+24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Hannah really think the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f647f3f2fb7af8c24199694d21bd25e27a31532d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Amelia think Hannah thinks the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. 
green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..de2d9f00f80f25b0e7f1911535fe6fd7a777211f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. 
+19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Jackson think Amelia thinks Hannah thinks the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b31557b7159d89d0065e0a921acbace3b947476b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. 
+34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Abigail think Jackson thinks Amelia thinks Hannah thinks the peas is? +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4a57368ea4ae557f321bf5a4cd8388f10c95a94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. 
+9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where is the turnip really? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..89fdde0609b94eb234f02b3983fec0ef7a39a2f8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. 
+30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Hannah really think the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f4d029612eafde8a83bfb1aa71ece590d306502e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. 
+6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Lily think Hannah thinks the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8959690947ee59891e5fc71b8c073270ef1305ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. 
+28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Noah think Lily thinks Hannah thinks the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f36dd46e71ade233872d264cf3ec59755829c4e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. 
+3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Logan think Noah thinks Lily thinks Hannah thinks the turnip is? +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..97221039752678d00fe45320a43993c149e28d5f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. 
+21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where is the watermelon really? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9bd5504cfa79db6d5243844af2c30ef34cc2f18 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. 
+31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Evelyn really think the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..10e0e2c24516ecb93c6dd71ad67d0693bffabe5d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. 
+8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Logan think Evelyn thinks the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e94faede2f19c6dcd97750874daccba262b34bf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. 
+25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Chloe think Logan thinks Evelyn thinks the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6efa28b12235878659297cef0492b57a7b02675 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. 
blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a033b824ea34cf709c92f97bdbc71d98c93a35f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. 
+19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where is the lemon really? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1dbd529bbd962117c73dfe894666a32f8564fc7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. 
+36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Aiden really think the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4a1982abbf7f6c2172031e421e20e6f3da553c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. 
+11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Nathan think Aiden thinks the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..299750f4998a99de4d1574346fdd2f957d79bd0a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. 
+32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Jack think Nathan thinks Aiden thinks the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7de08c528dff5359503cfbdbef08142bdf36d238 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. 
+7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Jack thinks Nathan thinks Aiden thinks the lemon is? +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e89d8235894cad7ec096eabff0ea7f2ab59789b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. 
+25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where is the cabbage really? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2de2572d61a9015334300a3cc0e5320975abf579 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. 
+32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Isla really think the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ff94b75bbcf0b4ff4ac78c2f0201265bae5a89 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. 
+6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Elizabeth think Isla thinks the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..de303b83de3af65e9d917fa788cb472da82eeb94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. 
+21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail think Elizabeth thinks Isla thinks the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed94c213d326137f04e9e258507cc448ce5fcc29 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/No_Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. 
+32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Abigail thinks Elizabeth thinks Isla thinks the cabbage is? +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8c1bc8317e77d5f7a1edc4519e05fb8cde81841 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. 
+6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where is the carrot really? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a71d68fdb252b72ffcfab409a3b832b1883f6b8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does William really think the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bb75290ee5349908059d646e7a9692b38f721bf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Hannah think William thinks the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2bc9f7263c354062376718f929a418891ef5156 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Jack think Hannah thinks William thinks the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. 
blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..126e7ba0e4f0535e536cf76291aef8ac57d81517 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. 
+Question: Where does Charlotte think Jack thinks Hannah thinks William thinks the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..341d678aeb510c12478bca1e5e3e69e3d5fa2ea4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. 
+12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where is the potato really? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cb946c90cfb29ede6fff2e31085541d6f31b1ee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. 
+8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Carter really think the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f9783f92b919aebf92bcb30b488680b52e07eb7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. 
+3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jacob think Carter thinks the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0469fe0aa9944b230487d79928a070ea20e190d8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Alexander think Jacob thinks Carter thinks the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a17d3625d5bd5366080dffd981f0fe9e87131695 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jackson think Alexander thinks Jacob thinks Carter thinks the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4451867cff643690dcf19bd68434bf87572da71e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where is the pear really? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. 
green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c5ac713f4de6ce9a17b04cc939a3ca2431013d0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. 
+Question: Where does Sophia really think the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..72fd13eb9a4e2a0a2e239b7fa88a7aa2c36fb49b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. 
+14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Ava think Sophia thinks the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..58564fd10a43c2bee3390a1b8bd23d188cda3704 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. 
+9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery think Ava thinks Sophia thinks the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a53dedae8b11655ebec65adfc4f6e2f35321dcbd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. 
+3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b925ed579fcfe8a6316a4535ce3363bddd8fd0b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2d08dae729e886481aa2ea4b6deaceeb8e13a30 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Ava really think the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc0e942bf205fd2cf1b3f3d1b3977ca7aa6ef7bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Logan think Ava thinks the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. 
red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f550396dd7da4ad1b6268308f11ce17ca8610efd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. 
+15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Owen think Logan thinks Ava thinks the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..72c1596b5045946dab8ef60fe48e60b8703a2e72 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. 
+10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Elizabeth think Owen thinks Logan thinks Ava thinks the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..61cf5648395724d8b8ff6c87c29aa16740b05ec4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. 
+4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where is the onion really? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..51cf532d564a7fa9da5f8b9a170f81f9b55aaf50 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Owen really think the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..aca2fc08d78897af24ff2dc6b9671a84f8bba3d4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Elizabeth think Owen thinks the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4578f21ecd43348a98f2cbbf2b8481bb54ee751b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Liam think Elizabeth thinks Owen thinks the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d13be255dcff0704ecf4ac2a88922e05b924cae --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Noah think Liam thinks Elizabeth thinks Owen thinks the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. 
blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..164056d20762503c1d576d7ea7f6697337f46c9f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. 
+16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where is the tangerine really? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6b183cc8de924a58893afc50644303c74385895 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. 
+11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Mila really think the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce2838225c5645e7986e40694c28f8acf6473d55 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. 
+5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Amelia think Mila thinks the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..313b51e6837eea08d394b21149eef44ea1dd314a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Elizabeth think Amelia thinks Mila thinks the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3f92fd374fb6b17724283981bba487f29fa1802 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Chloe think Elizabeth thinks Amelia thinks Mila thinks the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3f4fdd9465d61f293eac703615b2f51a46e6af9b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4e9f333a64f0cf93662cd83c9ba45eb212f2ed40 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Amelia really think the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. 
green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..45614543f3c4d1c4bc9594fca46e1c469374dacc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. 
+Question: Where does Ava think Amelia thinks the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1cdbc8e3b5885479940b1d20405cf1fa239ad209 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. 
+14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..053017f21ff32b4f097853adb16f783946c97ce5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. 
+8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Abigail think Carter thinks Ava thinks Amelia thinks the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3331918f2c34f0a3ba4a9456142025e141b65e69 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. 
+3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where is the tomato really? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3080b6825244ef654d38849b29d4cbbab1b3638 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Jack really think the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bab1f331b4d19b0e8d94e3b3349cc10fa3968ed3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Isla think Jack thinks the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a00e6783332acc601daafadc941a446a6b54a611 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Carter think Isla thinks Jack thinks the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..96f6e4fa1879cdfa5766c60a5bc6cad5d14c20ce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bdbd15dc8d499fbe97226530e786f283997d302 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where is the green_pepper really? +Choices: A. blue_bathtub, B. blue_bucket, C. 
green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..51758e21b82a3924bd5379031931813e2368b835 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. 
+14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Alexander really think the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..06437410f95aab57006b503e2504f90cba9c3534 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. 
+8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Evelyn think Alexander thinks the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cfe2e1bfd3d5de62d33190d0c52c705b287dd99 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad78b4b66104a72836b96978b4eb6ed7abfcc894 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Abigail think Hannah thinks Evelyn thinks Alexander thinks the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfe97fde13316e6cea62622c135872dc67a59e84 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where is the cabbage really? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. 
blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..37927d0dfb270331b37124e931aa969a636e79cf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. 
+17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does William really think the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..117c13eec03c0c7f87fe96f4bc0636a12680181f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. 
+11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Nathan think William thinks the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..01d5aa83b5330a1ca820a14ab2cbf59799996a5c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. 
+3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Aiden think Nathan thinks William thinks the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..61a135657b7a9ac7986e4fcd083bccfbde0e93fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c68455cd37bfa849d612964449566c433d04a9f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where is the green_pepper really? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. 
red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5e37eaa3b143dc1a0b3d495826fa8f92a3324cc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Logan really think the green_pepper is? 
+Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7e917de1c9d980bcbbc2b6a9d7e1d327a8b6ebeb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. 
+14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Lily think Logan thinks the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..aeff8f1965d1ff5856cae1d9124d2243f82cb255 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. 
+9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Ella think Lily thinks Logan thinks the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..de8febda98a49ab7eb5b5b1c8305c736895725a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. 
+3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Elizabeth think Ella thinks Lily thinks Logan thinks the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..948c60e33dd1a1aac65c0e1a9f8bfd0bdfeb49c9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where is the lemon really? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca5be90c863f16c9d7b4cbac1cc4e513c2904630 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Lily really think the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ae5b8811674e087a018c33567babc866b645078 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. 
blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..687d33d838bc31bb347abce8de965e6f2bed090b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. 
+17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Liam think Avery thinks Lily thinks the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..867c3a788a5088b052af87f82d711bd1507289f2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. 
+12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Noah think Liam thinks Avery thinks Lily thinks the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..eac1df5c0866e2dfdacdf4db97971dbc6761b2be --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. 
+6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where is the peach really? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..001cb0385e4b654639daffee5361972e8e388b94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Avery really think the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b3c4ab33c8c6b2186c5dba030549bb19e589ac3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Liam think Avery thinks the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..21f8e0303f33100c61f6aed19a53c839b2ce0712 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Benjamin think Liam thinks Avery thinks the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. 
blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0750ae3780a7a010a1524904667f92003dca7edc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. 
+Question: Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..614464694ebd64374af10af209af92ee08dd9c77 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. 
+12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where is the onion really? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..31a664ab50a383da450deaaa828ec59bd29b28c1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. 
+9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Lily really think the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b6ad1512c94f8e195783781ff05688c273e7bed --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. 
+4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0200af0fe116f9d73af0c74b48a7a90db90bc7ba --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Emily think Avery thinks Lily thinks the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..12b5491b64db920dcd8900f1cc8da71caf443025 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb9dd011b95c46b413c716c0a05ef7e0f7d82319 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where is the cherry really? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d5499fe794003da9216827f2c34dab8d23a5e7f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. 
+Question: Where does Jackson really think the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7e1fa454b6a1ad8be40cd1510b1d15c86cb9649c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. 
+10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Benjamin think Jackson thinks the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..20ce6e1323089bfbc42c96b19946edc67795b773 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. 
+3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Mila think Benjamin thinks Jackson thinks the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d40342ea79f6b6e2729b6d7fafe0b7217a489a0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Abigail think Mila thinks Benjamin thinks Jackson thinks the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dfeb5f1cb8b1f80ed6ee4b0358265fa853054ce5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where is the asparagus really? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. 
red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..db8a35c4f51ca7a709dc678839d9fd3b95e34068 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. 
+16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Logan really think the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb955fe1b7e7fc4f16b9a4449f9c2030a2a995e0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. 
+9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Sophia think Logan thinks the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..88377713aa1faa9f04fe6eac4540bfdfe989fe7b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. 
+3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Elizabeth think Sophia thinks Logan thinks the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..01886704ef43a70979a95d1140588b726ad35f0e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Hannah think Elizabeth thinks Sophia thinks Logan thinks the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c816db8e6ebef00e622984981d9fdb1013b694f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where is the watermelon really? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..02a6d2bcceef16f9bf8de86affb106a624313a6d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does William really think the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. 
blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7376f7c6a47f287f133d7bea54d971b38a80854d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. 
+16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Carter think William thinks the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa00672dc4adfc122f4ae838817f569de1a1565d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. 
+12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Owen think Carter thinks William thinks the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7f843dc1fae14c11d01fcc2cb4b0a2e607cf441 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. 
+5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Emma think Owen thinks Carter thinks William thinks the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa496b54b7c8598733530368275984080fd9fb24 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where is the tomato really? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..904d48044d147c981ae75006ef2a2ca6c7ec07c5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Emma really think the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f42a8e245cf4c899151af7b037a7311cb1bf9188 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Liam think Emma thinks the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..952a24e38c7b7bacb4de2f046c60e3de3864b6f9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Hannah think Liam thinks Emma thinks the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. 
green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b9bc315a4b5580d6865f837d9dba8f7c03cc003 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. 
+17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..36e6eaca6db964dbb9497bae2526d0a42f2b6881 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. 
+10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where is the lettuce really? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cf13124b631a0d169ccdf8147142a8fd2bb707a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. 
+5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Isla really think the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c6e805f4953a2fc56211bbc30e5a7a9f892664c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Benjamin think Isla thinks the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..821c0b9e93e8f8cd75c61cdccc8eda3c3de965ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Sophia think Benjamin thinks Isla thinks the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..953dfe7189b19860dc6d93d682fc2d220b3fdd0e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Emily think Sophia thinks Benjamin thinks Isla thinks the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. 
red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..05caade3fe50d0acd349c940e4e705c6b606d78e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where is the spinach really? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. 
red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..37360408de8eecf4981290dc994a724a7e0f9b8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. 
+15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Abigail really think the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..58dcd2483e7b808b569df35ee425c2e028128596 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. 
+10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Owen think Abigail thinks the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..21bceb1a61509ddf07cc50c3c315081f2af97783 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. 
+5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Aiden think Owen thinks Abigail thinks the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d99cfd550139452ea5e16f2c47ae0e6f9e37b692 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Jack think Aiden thinks Owen thinks Abigail thinks the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b1e1da8f4943136959dda696f4eff9f2d4d008a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where is the persimmon really? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. 
green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b85cf01bbd53cbc4ab6cb0225da56ddedde2d69a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. 
+19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Owen really think the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9da905c2768b5b698bc5cd7ec6e1469b542cd193 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. 
+3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Amelia think Owen thinks the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..387c818fbaf2f21a9f8636dd76283db12eed3e59 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Aiden think Amelia thinks Owen thinks the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. 
green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4a354a297f1d1379b38cfd81f892baaa170a4fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. 
+15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Ella think Aiden thinks Amelia thinks Owen thinks the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b106d6b1d5fd4ef590259e7d60d7e683e398a1f2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where is the persimmon really? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..94158f2a2eefbb04a639de4734bc9d756e211316 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Ava really think the persimmon is? 
+Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..856b72276b4cb80cb30e172e69d4ac6427129f62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. 
+13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Evelyn think Ava thinks the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e349a2c9b5ac00f950ec0b67e0193ae09ee0b00 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Charlotte think Evelyn thinks Ava thinks the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1cbe2e218e5bafb793299548524df7fae8a9cdd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. 
+Question: Where does Benjamin think Charlotte thinks Evelyn thinks Ava thinks the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..55d8315dfb2b749be7f92fc2eaa226d356e576d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. 
+12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where is the grapes really? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..10153cb45d1a8cabe70727f082004c59c851e502 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Benjamin really think the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. 
blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed76a7b4e29df121938b23a221fd27950fd55953 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. 
+17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Liam think Benjamin thinks the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..126c8120ee03418d0ca4bc1cdf794a6002b559a9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..067a909978f1b5987031d1e6d9a755816a4da74f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. 
+26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f4f41bcf07d43de769c4ed60e9e45d191bac8714 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. 
+8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where is the spinach really? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba67c866f2efdd336ff634e6bbdb4b9bcf7c3d82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery really think the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. 
green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b51c224324f071458ebefb308cb8f34c67e0b953 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. 
+18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Jackson think Avery thinks the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f9edf932cf5ff1125f62907432ab214701d62e38 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. 
+4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Isabella think Jackson thinks Avery thinks the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1728921ecaac2e9bfcd4bd8e2dbe958e8527614e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Nathan think Isabella thinks Jackson thinks Avery thinks the spinach is? +Choices: A. green_bottle, B. blue_crate, C. 
blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aee0dd730acd81285fe83d68af82adda4fe2304d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. 
+15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where is the watermelon really? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d74254ad6115a495951e5a250af5124858933dce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Jacob really think the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. 
red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5976e712cdd5835c99c09eae87ae7d30f174185b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. 
+17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Isla think Jacob thinks the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0c737772d157baa09a4e380473176b1fda6de34 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Logan think Isla thinks Jacob thinks the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..48f71c72abfc790ada746294379ab73fb9ea2ec3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. 
+27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Sophia think Logan thinks Isla thinks Jacob thinks the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dcf50fceb1fc1902131df2d9443583885113db66 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. 
+10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where is the pear really? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..178514505ce71625eb859ff906d612b72f39eeb5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Nathan really think the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. 
blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..330a875681eadd9622af43eb7856bacf9116d956 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. 
+19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Amelia think Nathan thinks the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff424c8dfaf0077551d59b48501578b1834c3bd2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. 
+3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Isabella think Amelia thinks Nathan thinks the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..474d14d9a6f076b6be3025bb672fd406164207c3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Owen think Isabella thinks Amelia thinks Nathan thinks the pear is? +Choices: A. red_basket, B. blue_crate, C. 
green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..062e7a06f20e03193919c462e3c2fdd03cc5b6b7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. 
+17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where is the potato really? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..80a34983f289d6e93cc744432564e9feb6bd1fea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Charlotte really think the potato is? +Choices: A. blue_cupboard, B. green_bottle, C. 
green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f16d64bb70becd42974f58dc6ab30a1a23de2f0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. 
+17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Noah think Charlotte thinks the potato is? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..966b40318d524b6301191fe186aa9758f7e44e22 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Ava think Noah thinks Charlotte thinks the potato is? +Choices: A. blue_cupboard, B. 
green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..697d5117409747026e1004bbd5799658784886ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. 
+16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Nathan think Ava thinks Noah thinks Charlotte thinks the potato is? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0667a3302c10d950c849fef617c6b2f775b86fc0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where is the cucumber really? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. 
blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e3867b16caba1868111bc3e65c425221a537024 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Benjamin really think the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e651cefc82fc96ca289a6fc017d95048e8a00bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Charlotte think Benjamin thinks the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. 
red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c86d592319f325ab57b8a767df27d5e3548a9ec9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Evelyn think Charlotte thinks Benjamin thinks the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe7f6c654b4b3c01ff0bae35b52f19ea2ed90d89 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Isla think Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is? +Choices: A. green_crate, B. red_basket, C. 
red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f231dbbaf1dfb24d381cc67a084e00edac7cdfe7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. 
+14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where is the cherry really? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..053b2116e977a4147bde1487fb10bcccf2c1e6a8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. 
+2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Owen really think the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..af3a5f83574f95f51bc8cd82be86061f2395d4a4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Ella think Owen thinks the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4862e907becaa5b75326271babdd844a353d17b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. 
+22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Abigail think Ella thinks Owen thinks the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ad4f152cdafd68809d77656f3d17ba4a4e39b3d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. 
+8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Emma think Abigail thinks Ella thinks Owen thinks the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ae631d625867e2bd5edc32e1556d7569eb304e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where is the sweet_potato really? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. 
blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..023574776eb23f5649bd7cc4b204eddda4cd4128 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. 
+19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Liam really think the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6698c34623a8fc382a7a93c5956121db1fd999c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. 
+5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Hannah think Liam thinks the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5263ba78d2ea6fcf49ba0a98bb1149b3b46abc1c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. 
red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1de4b9b854cd13849f642f574f6736e21bbb96f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. 
+18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a585c31b5a87e139063590bc016457a0a3f9c657 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. 
+3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where is the carrot really? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0eed43f1acaa8e35f48e20afb9e5f3c1aa79d0ff --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Benjamin really think the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. 
red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8fdd80df19385536a133eb8aa3f1fc727582e4c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. 
+15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Noah think Benjamin thinks the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..490940c96b7be041e96a34a598e4647dbb7aed82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Emily think Noah thinks Benjamin thinks the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee99d415cbf5ed67b9d0d13e6d39ee2665c6d238 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. 
+Question: Where does Sophia think Emily thinks Noah thinks Benjamin thinks the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..415bc24aabbef596bc8b812605325c4374cd2d1f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. 
+13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where is the onion really? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..860a013bc4c92141673e7319659562d017e35369 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Owen really think the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b242870722826ea00737bf71401605faa4eab787 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Emily think Owen thinks the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. 
green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..07be0f0ca34f8613cd7aca1637fbcc069aed24e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. 
+18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Isabella think Emily thinks Owen thinks the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f92b963658a4b9854223f807ce253437b39c4c6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. 
+3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a4ee93d578c0c733f5ec87d1a37df1f42e96ff5e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where is the melon really? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. 
green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3092b971be6f0845f99ed836549a211962b140f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. 
+20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Jacob really think the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a48f311f272436b679ea82622e8c9ba3ca90d3a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. 
+6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Lily think Jacob thinks the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..70627d0dea50c77e5c8b1bf2d3b7b22aaa8be031 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Evelyn think Lily thinks Jacob thinks the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. 
blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf54d8c6ee38ec32568381c8866f527a447ed95b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. 
+21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Ava think Evelyn thinks Lily thinks Jacob thinks the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca7f4a90123e2c41a5a40b01d8e7bb654f82df4e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. 
+6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where is the peas really? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e901af2a52cf12cbf94464428f1e49ca4344074d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Emma really think the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..540816d80073eb64cb38f8ca8112fccba021e648 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. 
+20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Hannah think Emma thinks the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb3cc050be01b608a08771750d14363139837949 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. 
+5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Chloe think Hannah thinks Emma thinks the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff624dcb434e644c451c788354a6e5bda10803c8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Logan think Chloe thinks Hannah thinks Emma thinks the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. 
blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..53e312e21f4cd006c20687b561588dc9f319c7d2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. 
+20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where is the cherry really? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d12a780372db1cf68225ef7bcf8a948e783cc93 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. 
+6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Nathan really think the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2aa539dc28b8ebc68aacb9fb8a12cd052bc74c2a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does William think Nathan thinks the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. 
red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..61e560eeb65d2f167bc474332c553b8e49e5276b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. 
+21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Ava think William thinks Nathan thinks the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c69034c33e6ee11cd08763367482284948e953a2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. 
+5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Emma think Ava thinks William thinks Nathan thinks the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4bdc34881f5765a63fc2d9e6fdfd4f822ade45e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where is the watermelon really? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. 
blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b3778f6e176f45d1a67ada3cdffc118afa9098a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. 
+16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Benjamin really think the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..752705d0286cbd0640e23ec3468eedc333d77ba3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Emma think Benjamin thinks the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. 
red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c22976c17f4d6182f6f9a0499712366880423cf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. 
+16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Isabella think Emma thinks Benjamin thinks the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7afe74f66f35c7b301eb7fa65b7d8f826b39cc6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Liam think Isabella thinks Emma thinks Benjamin thinks the watermelon is? +Choices: A. 
red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..11ee41ce67dedd4e4c55e44648a558a202855232 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. 
+13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where is the peach really? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b4c09d51bda7969ff6a6d29dcb0d502570fe0d2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Chloe really think the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. 
green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e01a7ff26e3ed81794cea93c4389a3a5be1fcc5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. 
+17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Isabella think Chloe thinks the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9bb40d333b286369c61a8a0733d631a6fa3fb17e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. 
+3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Nathan think Isabella thinks Chloe thinks the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b471bca1fb5cf1cd00c63d5430f7be9f94be9535 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does William think Nathan thinks Isabella thinks Chloe thinks the peach is? +Choices: A. 
green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a7c2f8529cb7e2cd5f43d7a9a3e27af4920924e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. 
+15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where is the asparagus really? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67bbaaa5f265ee3d9a5189a41ae1d111f2ad2005 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Aiden really think the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1cee8313b6aa331f46ff3b3629da2613aa91f15 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. 
+Question: Where does Emily think Aiden thinks the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..33114a0f086c42db23e41e987c209c145eb5176f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. 
+13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Avery think Emily thinks Aiden thinks the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..448d6b3305cf415c046bba59b04ffe3c159ea03b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. 
green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..45ccc0fb533153640d5d4608352d5e3ae08c0b80 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. 
+17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where is the lettuce really? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..70dbf1041882830d4542718af04a70cb9330a83b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Isla really think the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2e9fe60a6c89853c556da690e910cad52f15c26 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. 
+27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Charlotte think Isla thinks the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f98c35b80f042329ef56eb49b2f1a38a671d3bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. 
+11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Amelia think Charlotte thinks Isla thinks the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7be331108703a9683614f9f3c6b062c32ddcce56 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Aiden think Amelia thinks Charlotte thinks Isla thinks the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. 
red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2db1509ebbe3aeeeb8b046c79f98b3c2c01918f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. 
+16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where is the apple really? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b29bc8372a738cb102e212b37f056d2033cc588 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. 
+2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Jack really think the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a5fe0a8b376fe1f32eb38af59edf07039790b54 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Evelyn think Jack thinks the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. 
blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e12850c1ff845f078f803131958fd7bec5c5957c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. 
+17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Ella think Evelyn thinks Jack thinks the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c4b5dad520b4042f4d382f6d1b270335bd091b4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. 
+3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e464eaea648b196ba2b354a4107aa701b97baf39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. 
+30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where is the peas really? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b74bfc111495fa2f64653c246cb8b45be5337bf2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jack really think the peas is? +Choices: A. blue_crate, B. 
green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cee54088de55d72d8ca2c8e1cb2306bd92867d53 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. 
+15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jackson think Jack thinks the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdd71185d6a2de3417c916d5bf06b1f51bedf171 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. 
+28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Logan think Jackson thinks Jack thinks the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee5b571f5d22479c46015cf37de523f19ae8dfe5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. 
+34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Isabella think Logan thinks Jackson thinks Jack thinks the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b106facba423f866c708734e5a72ad2234900140 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. 
+3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where is the persimmon really? 
+Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2709c8fa66833b7eb8d32bddffa50dda974cb6a7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. 
+16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Mila really think the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b65431675737b7f85f523dec3ddd89fd1584120c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. 
+23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Emily think Mila thinks the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..363559aadb7f2c9a2803344265a7f5ad44a7da75 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. 
+34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Charlotte think Emily thinks Mila thinks the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a08265caf2f95337b6ab4c9eea6d343f06ed067d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. 
+43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Benjamin think Charlotte thinks Emily thinks Mila thinks the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..39c08c616a7b5bbb3aca15c6ddcf17172c43ebd3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. 
+7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where is the spinach really? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e905405c839851510a4fb17c27f3f597bd4d19cb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. 
+19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Abigail really think the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b9ae267794fae47e8bdd6fddea16e704a678a66 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. 
+30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Benjamin think Abigail thinks the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa47bb8f4a01d8d501cf98875381e807f501be0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. 
+Question: Where does Jack think Benjamin thinks Abigail thinks the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9da6a35771e60d80f52e817f12ec3dee2405d820 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. 
+11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..01f81c97f861dfb7fa7652643fbca43381ca8a7e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. 
+21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where is the spinach really? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c17500f38ee54b0c212253a9963fd0954be2d97 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. 
+32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Avery really think the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e10f5ee32831b1dded51f0dae263a8ef94a2619b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. 
+2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Hannah think Avery thinks the spinach is? +Choices: A. red_basket, B. 
red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..917fabfe53e91670afb31991b7dfced5a01b5383 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. 
+14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Isabella think Hannah thinks Avery thinks the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..aed743d4bcab8b4f082a2577a25b38b15452642f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. 
+25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Nathan think Isabella thinks Hannah thinks Avery thinks the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f03c447415a9ee47c10b9d60fd8ebc2aa8345f9b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. 
+31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where is the onion really? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4fb95b5ab2f985cf5845cb189ebd0f6f2461445c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. 
+3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Mila really think the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. 
red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..00f85a47b7da54d7aef26b7757ca06f8e2f645e6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. 
+16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Abigail think Mila thinks the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..38bf08926a78a6749a997d07ef5ae7ff1acc836b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. 
+29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Jack think Abigail thinks Mila thinks the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f6a82dfc6bf3e9a69c7077d1d2d56d261d3056a6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. 
+Question: Where does Emily think Jack thinks Abigail thinks Mila thinks the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5884dae25c826a9a256c4785b63a41034e2046d8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. 
+13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where is the carrot really? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..23500bec3a800545075d9e4006c9ceb5c98b47e7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. 
+25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Abigail really think the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..96eb122dfacbc37687b8bb07f9337b17e58404fb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. 
+32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Nathan think Abigail thinks the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..faa6bbee116bfffdce850b9102e9dab25703b668 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. 
+Question: Where does Avery think Nathan thinks Abigail thinks the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..df49b98e7c54b68923eaa0f889225a40d1c96e94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. 
+12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Isabella think Avery thinks Nathan thinks Abigail thinks the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ce569620ec90ec2bb2d8f98b8160d2de5ad2865 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. 
+21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where is the peach really? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1e2f1700e3ea6daa9468bab777a78962fc93e30 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. 
+32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Abigail really think the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..399862454c5726923f27593e0c587eedc05c0fbf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. 
+Question: Where does Sophia think Abigail thinks the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a373926d3f9e68ff0e9807a87296a14b5389d9e1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. 
+13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Aiden think Sophia thinks Abigail thinks the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca7d0ddc8758af40000f9f8058eddbfd9124f30b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. 
+25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Isla think Aiden thinks Sophia thinks Abigail thinks the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4ad105630b5dd3e31a7962d2388355fe0553937c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. 
+32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where is the cherry really? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a22abc209ecd7cee1f84a831904814a8efb6ec6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. 
+3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Aiden really think the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. 
green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..403c8d256f79354e0f263664993406f0b2c90d32 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. 
+17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Noah think Aiden thinks the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..edac6b5bf13f46e5db1ea6322c54a62beabd3af6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. 
+29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Owen think Noah thinks Aiden thinks the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd24ceb37fd7189ac6540c03e4f20e35c0012696 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. 
+Question: Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4351dd0892398516ef75a21444a5e844a1cc4cd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. 
+13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where is the turnip really? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c49fad7d082bef11aad4e627ddf15cd7499b738 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. 
+26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does William really think the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a30b3c9baf40b6a41b1ad5c8e2c859e6f7f741ba --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. 
+33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Benjamin think William thinks the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..18cd0dc1be6f1bf196a31d1210d14d51651a72af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. 
+3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Sophia think Benjamin thinks William thinks the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. 
blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2388773d9d1aab9736723f7bae80df77b04811c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. 
+16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Liam think Sophia thinks Benjamin thinks William thinks the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5aedf471f43893abd105ba65868325aa74790f0b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. 
+25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where is the cabbage really? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..403892477c3746c1284676a3a8e0a2e2f0580949 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. 
+29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Carter really think the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b63d84464613071fffcdf0fafeb1914f1d01c50f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. 
+Question: Where does Avery think Carter thinks the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..03113324e7140917394e329485bdfdfb8016b4ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. 
+11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Aiden think Avery thinks Carter thinks the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..86d0d6215e3a72575712a1c352b2273b59aaf84a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. 
+20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does William think Aiden thinks Avery thinks Carter thinks the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e072e643ca4ee494ce07544786ec4fec16685b6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. 
+32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where is the cherry really? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c3dc05f2ceb3f5b4b75b585c802564a693e09ea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. 
+5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does William really think the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e37422e855c02af7741c3db85bd897ceeba3e1de --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. 
+18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Ava think William thinks the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..115abded9e610679ca011ed6ea2fe88af4558b40 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. 
+32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Logan think Ava thinks William thinks the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf249aed68a130cb9a1ad6aece3d291d891060f8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. 
+4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. 
blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..345507bd277bc095af64eb46ed47c46f6bd5c405 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. 
+18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where is the melon really? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..32db49f8da4029eaa65b053661e50dd41611e617 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. 
+30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Aiden really think the melon is? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..313c83e25a7621541a0d0798aa83a720138d278b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Owen think Aiden thinks the melon is? +Choices: A. 
blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..33aed70fb00139bf72d77c5204b5a5ce351dc34c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. 
+15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Ella think Owen thinks Aiden thinks the melon is? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8aeef39fa0643f8dde8c7761df3d70e9ab90b60 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. 
+26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Evelyn think Ella thinks Owen thinks Aiden thinks the melon is? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d35063111846c13c86c2f64d9485c93ee59404af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. 
+32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where is the turnip really? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f914273243c37003a1c47e2ba645594a0c6d8dd9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. 
+4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Owen really think the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. 
blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..96ad1309f0025574c278835c3328328af9b157c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. 
+18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Mila think Owen thinks the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c83657ad7da34b0f0b26adb8bc45db7343517c2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. 
+32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Carter think Mila thinks Owen thinks the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7477ffd42f23f9bbd5c95519ceab2e6f65e50a2b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. 
+3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Isla think Carter thinks Mila thinks Owen thinks the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. 
blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1aaf05329b7ea7a16cc9988289c7c1400d66c890 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. 
+17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where is the spinach really? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..edf6e64aa2c66ae846167885231c75b6da8173ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. 
+31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jacob really think the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d525c7f78d15dd200193a5fe28d34addd65fb8b5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. 
+2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jackson think Jacob thinks the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. 
green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c673ec1da008e4d34e997b792f96881540c0fc8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. 
+16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jack think Jackson thinks Jacob thinks the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b3939cea0c3de7cd0669d6b8a1dd4e52b96b5c05 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. 
+30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Ella think Jack thinks Jackson thinks Jacob thinks the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fcd038c0254ae8f56885693a244e09eaa4cbabdb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where is the corn really? +Choices: A. green_basket, B. red_container, C. red_bottle, D. 
green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cce2767df373537aba896f258f712775dc1191a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. 
+16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Amelia really think the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..926dd0d0947b90c2048b21be39b8db9434edede6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. 
+30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Nathan think Amelia thinks the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f1bde0e514b967020b396f1a0d7d989407771b0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Lily think Nathan thinks Amelia thinks the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. 
green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cec2efbc44ffa6bace9e91bbe930961292c448be --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. 
+16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Alexander think Lily thinks Nathan thinks Amelia thinks the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c1be9177ab3c2102a8e92abebdf581b40f7103c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. 
+28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where is the sweet_potato really? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..27c8094f468157cf53a7fc903671107fac5f63b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. 
+Question: Where does Sophia really think the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..19f74e1cd681eeef3e7c5a4367227f47d68c7fc1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. 
+13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Jackson think Sophia thinks the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd6b2e11bb36f84563465f74821bad4fbc43579d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. 
+24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Avery think Jackson thinks Sophia thinks the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab99d86b1e12d967cb0306cebb6cd6d742b17b89 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. 
+32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Hannah think Avery thinks Jackson thinks Sophia thinks the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd38670133a62cf88fbe352553ca9bad5a430b2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. 
+2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. 
+Question: Where is the orange really? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4308991bc959f9b8da30875c58810b53d86a67fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. 
+14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Owen really think the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4cded3c6da286c3e593b52f031227283174ff8c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. 
+22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Isabella think Owen thinks the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9f83dc4fafacbbc72a9636629e5947d9104de19 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. 
+32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Jacob think Isabella thinks Owen thinks the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8eb29818e72c854c5efa03e21e56827fa0db6079 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. 
+41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Hannah think Jacob thinks Isabella thinks Owen thinks the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4e5e20727f7bf963d2508d5b756c0e19a57f6e22 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. 
+9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where is the lime really? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..85788fc86f0f21e98e03dec00979efb4d73efdd8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. 
+22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Amelia really think the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca58989513203a0b6f33cebecb8b46f3466db8e1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. 
+34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Sophia think Amelia thinks the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c62004553a73db85a51fc4c1bcf8bdf7e5d7f764 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. 
+4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Chloe think Sophia thinks Amelia thinks the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. 
blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..060339113bbe64b9f712d639e13a66b354114c14 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. 
+19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Isabella think Chloe thinks Sophia thinks Amelia thinks the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a96ceef60f5071a510e86d1fddc77502c5260838 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. 
+34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where is the carrot really? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce0ff508fe7790cd4684c55c22c95f8a1874c71d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. 
+3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Chloe really think the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. 
green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..74c589d5a41121896656e0c604bcdcb64215c410 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. 
+18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Amelia think Chloe thinks the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..43a084550e20d3b4a92108c6988e65e40815c091 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. 
+28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Avery think Amelia thinks Chloe thinks the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed159b4db183bf23e23fe20a740b1d9a561c5700 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. 
+34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Sophia think Avery thinks Amelia thinks Chloe thinks the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..52aa4c5b31e4fd02ebf903d115bd16d2cf158c5d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where is the watermelon really? +Choices: A. blue_bucket, B. red_drawer, C. 
green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..63f704d4d1494a48354f9d35f4c7a007c3cb0102 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. 
+14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Isla really think the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b308aa6f415b052c89ae50ea7cce23ee7987e97 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. 
+26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Carter think Isla thinks the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..df2cc8020e488a1fd91aa1117ff4271844e2235f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. 
+32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Elizabeth think Carter thinks Isla thinks the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0200f225dda2de9714e413b7cdfdef51d2de1738 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. 
+3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Nathan think Elizabeth thinks Carter thinks Isla thinks the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. 
blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe76c69183ad333f33187fe08735dd0c8d2f923d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. 
+18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where is the carrot really? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..51a3d950b69267ed244522fa914200103bb29963 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. 
+13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does William really think the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..47dda4c92bc2468811ac748f55382d576e03d1bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. 
+7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Hannah think William thinks the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a31d715f66259cb360ae47b8e6a241e27a2d976 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Jack think Hannah thinks William thinks the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ffb6b461696ba2caa4c73a74520a5d4ce7d6baa3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Charlotte think Jack thinks Hannah thinks William thinks the carrot is? +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6a312f26c9f34e91ccc90137b1ef2addf30143d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where is the potato really? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..42867eeda053d0a86ca43c38d23de9cceb84b802 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Carter really think the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. 
green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..855b8e9bbfe4669367a1a93a3d693a355731ac78 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jacob think Carter thinks the potato is? +Choices: A. blue_bathtub, B. 
green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..302dc61421b5e5981160d9e26b8a7ec3a0439902 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. 
+14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Alexander think Jacob thinks Carter thinks the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..28539070e1585f4eb7c88bfe783c43f645268547 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. 
+10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jackson think Alexander thinks Jacob thinks Carter thinks the potato is? +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..289b9e247f7572f92aa7dba12b5536b8995fad62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. 
+6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where is the pear really? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b00d81c488776803464c38b451718c388159b8ca --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. 
+2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Sophia really think the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8112ef20de2e759e3a2e1a3cdc1a8513929baa29 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Ava think Sophia thinks the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..31c02aff3660a7407b2eb1a975a9ffb32490b3fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery think Ava thinks Sophia thinks the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3bcf64a307a966796664a60d927285037273f985 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. 
green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4296bb7588645a2f4597294b0e4ef8660c04155a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. 
+Question: Where is the tangerine really? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8ad00cd4f3b418ca33f40b7c3b74846da3a6213f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. 
+13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Ava really think the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b2d6946dcffd45c90e4680359980ad169157e4b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. 
+9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Logan think Ava thinks the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..611ec521398d2a37e5828e6e9ba27d74394010ce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. 
+3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Owen think Logan thinks Ava thinks the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..97467e698968251c76cfdd60261485f1d8cad4d1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Elizabeth think Owen thinks Logan thinks Ava thinks the tangerine is? +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..193e81e8c144f82f54e3be91139cdcd5b3c4a21f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where is the onion really? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c118d81219bdfe01a367d65873e17f38c5ea3a76 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Owen really think the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. 
blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d902d22d390062f22f28d53bee3b8266005b020 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Elizabeth think Owen thinks the onion is? 
+Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d141996055207708d570f8c3198a7f036b93cc51 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. 
+16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Liam think Elizabeth thinks Owen thinks the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b84ff916d02b191eb3c760eba28e8b3654bead49 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. 
+11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Noah think Liam thinks Elizabeth thinks Owen thinks the onion is? +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e351c16e8e04f8a429526cb0c3cb1ae6f0ef745d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. 
+5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where is the tangerine really? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e36781c649073da990a4d1fa8443e2d68337007 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Mila really think the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4fd5aaebc4ff0cac7b642f3e58c106114d958e28 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Amelia think Mila thinks the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..70d09a1ed567c65a1c2a8e0b06ffa1df84ac2f7a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Elizabeth think Amelia thinks Mila thinks the tangerine is? +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..362f8b3c65a1f13bd96c13d8442e9ae3d84f6a5a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Chloe think Elizabeth thinks Amelia thinks Mila thinks the tangerine is? +Choices: A. blue_crate, B. 
green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f393cf88e2a8cfce7f246754aea57cb06004700 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. 
+15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e6ef8cc4b8b7a92b8264993fbfceb4d95e71d95 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. 
+11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Amelia really think the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1a71e8b6ff56b68c473d93ecf739245316ecc09 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. 
+7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Ava think Amelia thinks the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..341ec79aab259de5be2a2550b6ec126f27f10243 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. 
+3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..efe81ab4400104024d3a8c97d999a16be69defbb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Abigail think Carter thinks Ava thinks Amelia thinks the tangerine is? +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf4f75335805d133634b4272b6730d44a883d58b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where is the tomato really? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f801f39ea09f838595769c2b7f079604c39aba2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Jack really think the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. 
green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e5e4f6e093a34c62cea28dc50a0e639e4461c02 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Isla think Jack thinks the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. 
green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..63ddf6d76c5d1fa1381cb75b52c4dc60009e77f7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. 
+Question: Where does Carter think Isla thinks Jack thinks the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..97f40b9ab7e5c1711975fc851ead30c08b2634ee --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. 
+13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b44955d7657f5014ee6259f803ed316df41f062f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. 
+8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where is the green_pepper really? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f03ae79b724416099e25977f3ed3f0fcdf2400c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. 
+3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Alexander really think the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..db65b863c5d2c298d7a1f4fca7a79f4c5c1fcf59 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Evelyn think Alexander thinks the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..89e854984119387be4bd7b7e5e366c36f0270e55 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..768eb652d9e14ab5675a8b54a0453db3be8ffcaf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. 
+Question: Where does Abigail think Hannah thinks Evelyn thinks Alexander thinks the green_pepper is? +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..18e252da415daaac99fcb6c69192df7914b4206b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. 
+12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where is the cabbage really? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..629227b31ecffb2dc05c292f436895458ada0afc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. 
+6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does William really think the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc31cbcdc854a63570d882425db339bd5154f337 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Nathan think William thinks the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c5dfb5531d9d1d0f1376b81ab132082c5f49977 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Aiden think Nathan thinks William thinks the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. 
blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5ac1b2748032a226dff6b0e532969bfcc636a5e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. 
+17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ad8947b6e0bf6552ef9f7ab9713337cdb9e0574 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. 
+11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where is the green_pepper really? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f707616aa79fe07a9197cab3c9fd5d513666ba --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. 
+7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Logan really think the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ad240b0bfe1dbf03e2c4302e06e4a84ba981e0a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. 
+3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Lily think Logan thinks the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bd7282b09102c1382bd7419b31b4bb7a473da39 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Ella think Lily thinks Logan thinks the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1580f856926c48f183af097ec64a2686db968c95 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Elizabeth think Ella thinks Lily thinks Logan thinks the green_pepper is? +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ccaca9a04756f19f0f63bc4cd1e14ba9b810637e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where is the lemon really? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. 
red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6c0de26463eb4b57f34befe9e2ac9769265b975 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Lily really think the lemon is? +Choices: A. 
blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..45ccd53bc0cf5878b009a08209c57850ee372b83 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. 
+16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff09ff5587f50e634561e1f63ff0ccf46905b4e3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. 
+11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Liam think Avery thinks Lily thinks the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b5a880694e25fd1eeae9d544763fbc9418f2256 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. 
+6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Noah think Liam thinks Avery thinks Lily thinks the lemon is? +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a70f67aa12e73d696a6f016e9ae759a1d2b52c05 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where is the peach really? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..395299da35ca5ba2f628591ae05ad9fed27d93eb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Avery really think the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f31f123da7d08855106a496be77c7241fd655a8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Liam think Avery thinks the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7fd38a473f6bf148a3f44b2079b56715a7de2fa3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Benjamin think Liam thinks Avery thinks the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. 
green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..618ffbf79ae3707f64e5f34c536f2a39fabfa81e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. 
+17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c5293039f3899c98e047b88785f6ba91c50af8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. 
+11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where is the onion really? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d01e3688fdb0cc239f73e38aeb250082d0634ea1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. 
+7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Lily really think the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb1c1cb7563a388a8838167acb5000d7c6d91942 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. 
+2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ad6f4e9175d18fe710faab6a077d59534d1c3dc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Emily think Avery thinks Lily thinks the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c662feb7d1b0658e172666218adb3173fa5a80e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c7c3afb61ca5b006451f01ccc384b8e0f8174e6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where is the cherry really? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. 
blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc1fa1c876042cec03af907c881520c098723038 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. 
+13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Jackson really think the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa9748323603d6733dc834838c11102f64eb8bd3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. 
+7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Benjamin think Jackson thinks the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b56a33486fb3b3caf9c68e94a534bb5bbef1d59 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Mila think Benjamin thinks Jackson thinks the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7de201318ecd660f09625cce6b4eaab6d19e1e5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1,21 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Abigail think Mila thinks Benjamin thinks Jackson thinks the cherry is? +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b71f76756b4182aa2e3bcecc7e297e35b08ff4e5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where is the asparagus really? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. 
red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..95f38701caa21b684571ce82da9c5c0e9934101d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. 
+17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Logan really think the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..039b44206b4df311a6e9e2b374bd77ff70d1b260 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. 
+11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Sophia think Logan thinks the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1824f84b07863406d4906610275f8ced3ac86188 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. 
+5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Elizabeth think Sophia thinks Logan thinks the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a914ce7fdeba0c065690aa17502e16ff8bdc4936 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Hannah think Elizabeth thinks Sophia thinks Logan thinks the asparagus is? +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e1cc1d7a7e1e458e390c0620183267b53dc2912 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where is the watermelon really? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fb5017ca9b9e69208eade7d57fc82df7f2a58ac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does William really think the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. 
red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d90830125256a22fb2c2f97930f41d757dd257e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. 
+Question: Where does Carter think William thinks the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..70cee65605632d6d84e66724770d137312e27bb0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. 
+14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Owen think Carter thinks William thinks the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d0ce1dbb5d9be1ffc396078ee40a8131469bdc0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. 
+9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Emma think Owen thinks Carter thinks William thinks the watermelon is? +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0acd5e3530c35f59af36846eccf2b65e1ac0773d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. 
+4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where is the tomato really? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0502a60aff84865c36ab65792106d4580b860fd3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Emma really think the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d700e4a17597c8ccba381179a6730d186121c98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Liam think Emma thinks the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b53a711d5b18e90dfe54be660d31669ddc2999d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Hannah think Liam thinks Emma thinks the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. 
green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ec5a30c98801b6f98797aab46ca77bb5e85ca96 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. 
+17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f8c222364fc85d9f52a22836aa0dddb7b3343d4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. 
+11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where is the lettuce really? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fdd9904ade9a308fa52e6a499b39c92048f1ebdb --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. 
+6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Isla really think the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e70ca4a73f450602430ef1bb2d4028828a1e64aa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Benjamin think Isla thinks the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d13892790fe9e8a8888c32cb3eaf250daa13942 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Sophia think Benjamin thinks Isla thinks the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..012b0143669ed0b340406eab470eee33c32e9d24 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Emily think Sophia thinks Benjamin thinks Isla thinks the lettuce is? +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..43346a5bc9f1fc3e364886fdba08efb175dbd144 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where is the spinach really? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. 
red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..561c7b65b788f97df18ba97a6faeaab0d143c38e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. 
+Question: Where does Abigail really think the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..695d4b844e3976dba21fd0cf1e621fe5230f829d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. 
+14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Owen think Abigail thinks the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..899f792de5fa0b83f5f24a398c9c44487de163d7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. 
+9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Aiden think Owen thinks Abigail thinks the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a2fce4e43a1a0a060863af10484185d0264ec0e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. 
+4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Jack think Aiden thinks Owen thinks Abigail thinks the spinach is? +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..74978ad157cc31c81eeba83a66f0955d0c10d352 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where is the persimmon really? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c957155955c58e1b8334d1aa70cc583b13022bd3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. 
+Question: Where does Owen really think the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0702858e03343e2ae0facc021b546e06d3e5a2f8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. 
+14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Amelia think Owen thinks the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1565ba302c42040e379d4da5cbc59b96643dc158 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Aiden think Amelia thinks Owen thinks the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. 
green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..915c5b12718538c527878d78ee345dab73e96e01 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. 
+20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Ella think Aiden thinks Amelia thinks Owen thinks the persimmon is? +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dcb86fa2044feb9f8d9a3df8ae5380b761332891 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. 
+3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where is the persimmon really? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e895ac2c29c8f1221a582767385ceb025f5a537 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Ava really think the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. 
blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..50c58734c6f8550bf52779dc7b971eb6bbac3656 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. 
+20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Evelyn think Ava thinks the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..34db0fd7f5ad32d8035587105d86c9ddc56fc7e9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. 
+7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Charlotte think Evelyn thinks Ava thinks the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e34bcf24eb1bf216c2a63d13d0777cd39f4efff8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Benjamin think Charlotte thinks Evelyn thinks Ava thinks the persimmon is? +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. 
red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ca5890dbcfdcb30510d02b2ae99ed46403e6fe4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. 
+20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where is the grapes really? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..874fd0b18bdac450a65f30fa79e5f6418329f305 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. 
+3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Benjamin really think the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..72459e0f60ed6b9b5bacb340f215a7f0b312cee3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. 
+Question: Where does Liam think Benjamin thinks the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2710932cae105c878e466c4abf51ebd66b6af027 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. 
+14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..be2d4f65aef15b7404c02039e7aaea5efa11fc44 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes is? +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. 
blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..99fbe007cc21e0789f6f559590ec42ffcd348aea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. 
+16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where is the spinach really? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d0df3a61af7f846dcb122e1cb2be1e17ea02c02c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. 
+3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery really think the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..50c0f00285b21fdba605953ad5b7dc19e6ec1e7c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Jackson think Avery thinks the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. 
green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f07ed394998ad0289065033b020bb94f2127cbe2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. 
+16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Isabella think Jackson thinks Avery thinks the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b6d328aa32308d1ee684c323fa0a12b37736d85 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella saw a monkey. 
+2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Nathan think Isabella thinks Jackson thinks Avery thinks the spinach is? +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6aa54ec35ffa1488547fdd315d52a0765e52651 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. 
+28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where is the watermelon really? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba7ab189d7859eaf48a93ae8ed5a8a3af253fa45 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. 
+12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Jacob really think the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..33809f7f07c430042d50a39cca6b54f00d883051 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Isla think Jacob thinks the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. 
green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cf470afc8e32b44a0b3f976313be90e03dec0ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. 
+18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Logan think Isla thinks Jacob thinks the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e73b956920ffaf611b23ebe4722c78b73d6a1021 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. 
+2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Sophia think Logan thinks Isla thinks Jacob thinks the watermelon is? +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8ee257e0261cf9c80d8e9f02d635c7f702e6006b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where is the pear really? +Choices: A. 
red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9dc26280400b2d90ce28f04ddeb54674547b7817 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. 
+16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Nathan really think the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a1e75a34f988e36439797fcf56d293fab282650 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Amelia think Nathan thinks the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5e6b01bc144f73062ccd135e60cbb6e4688aa46 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. 
+Question: Where does Isabella think Amelia thinks Nathan thinks the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fb396bc2c7ee75f50d7ab5443d4795943cd65e8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. 
+14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Owen think Isabella thinks Amelia thinks Nathan thinks the pear is? +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a65a9a3aff941223dcb1f4c07e52abbcc9802895 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where is the potato really? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. 
blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..030b7a3778eb2d3f9f764fd6c87b90675bac3eba --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. 
+17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Charlotte really think the potato is? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3224b9259e1c89afd2a7d43a84e016fbed9ffad6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Noah think Charlotte thinks the potato is? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. 
blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..01a05e232e503329b997ea92de2a34337d5c4a75 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. 
+17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Ava think Noah thinks Charlotte thinks the potato is? +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf437de5b73798cac83d3605f73c42d4c250c677 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Nathan think Ava thinks Noah thinks Charlotte thinks the potato is? +Choices: A. blue_cupboard, B. 
green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..66cd284f3a800c937bfcf8d8f44fe232731b0dd3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. 
+15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where is the cucumber really? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..166cb17c85db15a035ff8aada283eeedc647a80e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Benjamin really think the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. 
blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a4cfc4e8a11a8e4856297dcdcc5eeaac92c4d5e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. 
+16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Charlotte think Benjamin thinks the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ccb770a06804e394963b965d0eeb0fdfc4acf9d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Evelyn think Charlotte thinks Benjamin thinks the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. 
blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9df26bce981a6b7ac6d1768cdac1d5eca4f26f16 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. 
+16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Isla think Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is? +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7325511acbf512f59638740220bc5415d836645b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where is the cherry really? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..27fdac2aabf9f95be5b0f9a506206322332a35fa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. 
+22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Owen really think the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bec5abad6cde2a3a6cc7e39a4f3dfda404b427bd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. 
+9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Ella think Owen thinks the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba7ba7d73d84fbd4984c31e7752c3fc7309b7d5a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Abigail think Ella thinks Owen thinks the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..634903e39f40fe2094769d834298ef042ef2568e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. 
+22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Emma think Abigail thinks Ella thinks Owen thinks the cherry is? +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..50a76c598045447a964cafba9268ec1a128a83a9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. 
+8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where is the sweet_potato really? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69a855ae4b42b828cca24029f269dd69e8aa62 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Liam really think the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. 
red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c21f80cd80e5892f52cedbec21900947657ae942 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. 
+20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Hannah think Liam thinks the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2ad09d4cce93fc8ca53d22cbe9d40108512a2312 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. 
+6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..23facba2abec300697f0ec064a35bb7563ddb6d4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. 
red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9820ffafca3e0790ffcbf73ddff25c80da87b255 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. 
+19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where is the carrot really? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f1754bedac20a7b6934075be7ef0ae7a983053d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. 
+5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Benjamin really think the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..856e831e416f09e5cafeb053cea8ba2d6a21de17 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Noah think Benjamin thinks the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. 
green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0f3221af45864e7ab22b3750d3730971fd0188f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. 
+19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Emily think Noah thinks Benjamin thinks the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f39724c7b28a3a24f14e80d940f5af22069dedf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. 
+3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Sophia think Emily thinks Noah thinks Benjamin thinks the carrot is? +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa7287bb84d12013909bbe0a729433e00a0aa434 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where is the onion really? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. 
green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d45c8ff6a9e88462ae3a328517daa6a07eacd4b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. 
+20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Owen really think the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a4653a4cac357f3aa689aee7ef944a8a54f3148 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. 
+5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Emily think Owen thinks the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cd3d44c2c9975e86fa9063d356982ea60e257648 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Isabella think Emily thinks Owen thinks the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f9b60ba7beec218a06d31060c2e5aab8db75e63d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. 
+22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8dcda8ea65b596ed5bc7894b68efc258c7e345ef --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. 
+7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where is the melon really? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3ad04011a0f1ae0cd63ad770afb3ba673a3f38c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Jacob really think the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ea456631358669d1a387292230c6d8a310bbbe4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. 
+23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Lily think Jacob thinks the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc88ba2f0fa6cfc17619192cf27a17535525be37 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. 
+10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Evelyn think Lily thinks Jacob thinks the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8329890d18469f10569cddd4ea0edbe732cfe59 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Ava think Evelyn thinks Lily thinks Jacob thinks the melon is? +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..89c05986648a656c38fad9e92c2900c76f1f5bbe --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. 
+23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where is the peas really? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed9e18c986b577c3b20ae66721a7b424562f38f7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. 
+9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Emma really think the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8190a1c9f1a5b71d0d12d37697e6a04754724e1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Hannah think Emma thinks the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..87924046dbafca78103d8990a0150e1ea1b146d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. 
+21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Chloe think Hannah thinks Emma thinks the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1fdc7130ea3b9e948dcf5757a144aa2d0d595af0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. 
+6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Logan think Chloe thinks Hannah thinks Emma thinks the peas is? +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..89a41717c8fff4c444b41fd3bb7a79f5213c1e6a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where is the cherry really? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5ebbb27df2249d830fa65e8deb13e1ff0e91f1c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. 
+23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Nathan really think the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b14129c1a37a9e7eb76556f1853c17d2e23c6bad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. 
+9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does William think Nathan thinks the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..195400ca7c72f47a0d5a94a2705cb8e74989093f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Ava think William thinks Nathan thinks the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. 
red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5c5825ed8d1c6c5bdfd40fbc176dfebc9b46cc8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. 
+21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Emma think Ava thinks William thinks Nathan thinks the cherry is? +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd7837eb6bd9ac05aa5cb905f74808c3cbc3d3c7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. 
+6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where is the watermelon really? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..62737e111c86d4ba2039ec68c96879362a1eb076 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. 
+Question: Where does Benjamin really think the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..31a4c1d0d895c3059a163506d22818addbafea88 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. 
+13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Emma think Benjamin thinks the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..da04025ae53e04cebd79e575316d7cea8e2bd29d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Isabella think Emma thinks Benjamin thinks the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. 
red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..297691f6e2377619d1ab1f08c906b18f1bf2d620 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. 
+16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Liam think Isabella thinks Emma thinks Benjamin thinks the watermelon is? +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..38f3e96efb04303e43a7d7ed656037511e0288b9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where is the peach really? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. 
green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..069425045b9fbdfc0de6f0d5d803b259be509055 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. 
+19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Chloe really think the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ff6a9149fb2a6163e9410e5e158a3053046b9f6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. 
+5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Isabella think Chloe thinks the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..51b055096d0ecce3152f74a987c9a8822ac56e66 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Nathan think Isabella thinks Chloe thinks the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. 
red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..173e911c22a686a9f1781b0fee5bda071f0e2706 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. 
+18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does William think Nathan thinks Isabella thinks Chloe thinks the peach is? +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5060fcbe868e30b1cae6b52322376679da81cd23 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. 
+4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where is the asparagus really? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b7b370e3407bda17d9c787157584220b83ad9aa --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Aiden really think the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. 
green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5bb4690d677b16e8eaa2d0304ca63e1f422faac --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. 
+17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Emily think Aiden thinks the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b9cd5b855711813b24b7c493e17fec713437966 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. 
+2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Avery think Emily thinks Aiden thinks the asparagus is? +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f159f5d65cba7380f724c435e3e33910e6e20fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? +Choices: A. 
green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e88ed81e08156026fc21f427ce758c7c541ff71 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. 
+14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where is the lettuce really? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..07f47d929380b5912eb96534843e6a8022bc7fb2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Isla really think the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. 
blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..875072bddd4d330739d5e3b3cc22230ea022acdc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. 
+18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Charlotte think Isla thinks the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fb9da8eea5973ae756acba4ede173425dcfd344 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. 
+2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Amelia think Charlotte thinks Isla thinks the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1798f7a4904ce717b5b20eafdb9f4ef0a567ebc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. 
+27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Aiden think Amelia thinks Charlotte thinks Isla thinks the lettuce is? +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8865a2c446b5c30d740549162b4b2870e5cd9d98 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. 
+12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where is the apple really? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3cad14df76383994fb1e722aa7f4e269589875af --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Jack really think the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. 
red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4bba6f1f4f51751b896caeeb0d7f4c08b4c089ea --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. 
+21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Evelyn think Jack thinks the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..25faafd63127f9803f93de7bf9873f82416901fd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. 
+7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Ella think Evelyn thinks Jack thinks the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..077f8007368a5d4b1941200de5f236995e364125 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. 
red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d3ca9f713509d77923abdfe9d23a754f68e0c48 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. 
+20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where is the peas really? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fbe26e8f40a767c769c297e5f3c9fb1d3fc55cf0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. 
+34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jack really think the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3658fe7d4710a6cbc9ca0dd5423f91a99865ee8b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. 
+4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jackson think Jack thinks the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. 
blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1eb29d8d689bafa66d300c8a478271dbc2162932 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. 
+18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Logan think Jackson thinks Jack thinks the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3b4163c64e37f743891bb8d90877611b23cbe5e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. 
+31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Isabella think Logan thinks Jackson thinks Jack thinks the peas is? +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..32f96f754db8bdb2629e096c6325526bab20f234 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. 
+45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where is the persimmon really? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f5ee2106c9a30b0ac429d61dd3fca66a83cfd5a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. 
+14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Mila really think the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..566fd15ec7ea46f1d2679506e1fe2841fe979db1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. 
+23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Emily think Mila thinks the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..13d425843347262f1d66f2e2bacd19d1869577a8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. 
+35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Charlotte think Emily thinks Mila thinks the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..55f492abbf9768d497189f3729f0335d2f07212a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. 
+45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Benjamin think Charlotte thinks Emily thinks Mila thinks the persimmon is? +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e885131cbe6e1f5b48d8a10b092b1bf00dc56d7c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. 
+10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where is the spinach really? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..80eec26a0b61ab7f270772587298bfd8ed60c95a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. 
+21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Abigail really think the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..83c9b61ff9cc8f2301347a26aa59006713161641 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. 
+31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Benjamin think Abigail thinks the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9fc666c75229caf7bcddc332dcb844de739dc2bf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. 
+3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Jack think Benjamin thinks Abigail thinks the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. 
green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0a504365bee292c9293ecbfa5051c591b847e71 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. 
+15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..991ffe3607ad4f918dedee9e66691465202f58f3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. 
+27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where is the spinach really? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb453bcc50964e7f49abcee4fddf4c1aa62e1095 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. 
+32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Avery really think the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e41ef5cebd0a1b9912b05b32fb9660783fde1f37 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. 
+3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Hannah think Avery thinks the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. 
green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d700849db0ec601928e4ef26545b9afedce3e3d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. 
+15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Isabella think Hannah thinks Avery thinks the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4080fb6114921df0d002e81a54afbdcbf9d236c2 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. 
+26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Nathan think Isabella thinks Hannah thinks Avery thinks the spinach is? +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e027ff6131043d40db37159bbf0029bf54c1b786 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. 
+32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where is the onion really? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a78cf5f5e8f8c643122000a5262917798f249c4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. 
+5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Mila really think the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. 
green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d2c20270f51d98652537b1ffcdd62c4cc210338 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. 
+17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Abigail think Mila thinks the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..58d7099d82d60cb46d4c24eba3f509f91affc157 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. 
+30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Jack think Abigail thinks Mila thinks the onion is? +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..80426273e643c9943864705ba1d56699a713e36e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Mila saw a cat. 
+2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Emily think Jack thinks Abigail thinks Mila thinks the onion is? 
+Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4ecf8fe8d974543e880b38c1a9b315a4047918c0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. 
+15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where is the carrot really? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..742b68b49e66c48d7e1ea5001ef4494adfffe7ec --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. 
+28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Abigail really think the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7a29f6769ea66cbbd549e7d5fc8e25db273304f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. 
+33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Nathan think Abigail thinks the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ee883d3dde7e6d729f68d4e326e7be8b6d5f639 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. 
+4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Avery think Nathan thinks Abigail thinks the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. 
blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfbe84349ffe8bfc2886b105dd3e590d041fcb2a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. 
+16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Isabella think Avery thinks Nathan thinks Abigail thinks the carrot is? +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..45ebf35e5bacbcfe48a5b3b2bd0349c2231143b5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. 
+27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where is the peach really? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..858477a58280ccbe04670cc57babc16e73cb218f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. 
+33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Abigail really think the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..161239ab6781c2ebc32e2d0a9bad76daf2fc275d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. 
+4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Sophia think Abigail thinks the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. 
green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7cf4abdf60feb757c785d20a482acfe3ad3302a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. 
+16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Aiden think Sophia thinks Abigail thinks the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f4146abbf8692ab4510ddd64f6159c7e0c364d8 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. 
+29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Isla think Aiden thinks Sophia thinks Abigail thinks the peach is? +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d16a2fa729a341453a7c9da9d054deaf336ee23 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. 
Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. 
+Question: Where is the cherry really? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e6aba05da2735ba94d69d647840ba133772585d --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. 
+14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Aiden really think the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4e9325d5beb5fac1c9330e11d1b1ee572d4aeb4a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. 
+26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Noah think Aiden thinks the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b50c513e97afe664011811813d153d7e0ffb812b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. 
+33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Owen think Noah thinks Aiden thinks the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c0846596595acafc6d6c3a1fb2f99232f21566f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. 
+5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. 
blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cf4c2b98dfc68896c289087820992427c85fa65 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. 
+17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where is the turnip really? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64f06df13318a01e6d1dd868bc2f20771300b884 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. 
+31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does William really think the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c3a9572e703e111a435050f3df741527cc2e6ad --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. 
+2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Benjamin think William thinks the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. 
blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..089f32b389fa2d62e2f7ab540a50d6b9da2c580f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. 
+17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Sophia think Benjamin thinks William thinks the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..84293a9123f296411c7e559b6a6c63677a3f25da --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. 
+31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Liam think Sophia thinks Benjamin thinks William thinks the turnip is? +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..01c678d26d4900a7b93c1a307fb34138f58bce15 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where is the cabbage really? +Choices: A. 
blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c805c5c5780c5bcc40784a7d1fb1f494e239f64 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. 
+13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Carter really think the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5453859e133c74ecf5f9d303ad688556d9470888 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. 
+24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Avery think Carter thinks the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..29e7141ea03887576f7c0c8a5df63d5aae99d355 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. 
+30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Aiden think Avery thinks Carter thinks the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..54f883850de09b1d7be1c248d18fef11ba56cb53 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. 
+3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does William think Aiden thinks Avery thinks Carter thinks the cabbage is? +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. 
red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ef708e097080f202167b7db2f351da9775dc757 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. 
+16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where is the cherry really? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..90c5bdf444a12be1b37eaf2f614a1f8bbb1d5fbd --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. 
+30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does William really think the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..68f4f3eea801a1b5857cf783fe6d1d45cee24a41 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. 
+3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Ava think William thinks the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. 
red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc564c269716b415d4585f6379ae2f7005ca6e33 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. 
+17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Logan think Ava thinks William thinks the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..13ff3a8eb7e31355c9d08a30fc2eeabe113e414b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. 
+30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b3dd845157bca47726361f2ad9fee77e1ef6d0a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. 
+3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where is the melon really? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. 
green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d0d14626fbfeaa78e67019808d2f66f073870a2f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. 
+17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Aiden really think the melon is? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..af12edfb2aaa12592b41666bee26ae8ac0bb3a4c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. 
+31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Owen think Aiden thinks the melon is? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ff096d55edc90a8f7aba9b9dadd7840d3436d11 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. 
+2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Ella think Owen thinks Aiden thinks the melon is? +Choices: A. blue_treasure_chest, B. 
green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..256d15e55e5832497ce41b29c7cfe2c244f13bfc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. 
+16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Evelyn think Ella thinks Owen thinks Aiden thinks the melon is? +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2dd63af30108dc400a23673b413c2163f5d2333 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. 
+28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where is the turnip really? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a6ea423436c56bc5a6f7acdcc7f6c20f4c3ce93 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Owen really think the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. 
red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..301adfbfb0ee11c60ca9d9218f08988fdcd4f7f0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. 
+15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Mila think Owen thinks the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbe660416dd0461b8dc034ebe3dc687e0ad1d364 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. 
+30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Carter think Mila thinks Owen thinks the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a64e4084244063b69006e5e7dbeeb33267b91ad0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. 
+2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Isla think Carter thinks Mila thinks Owen thinks the turnip is? +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. 
green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3074279242bada1dc9dd8704bf91891eaf87abc4 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. 
+17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where is the spinach really? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..eaa98915defdff6e8927f93fcbd728e7f41e1352 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. 
+31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jacob really think the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..725ba4bcaeeaff1cae42baa66946e06f9d52dfb7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. 
+2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jackson think Jacob thinks the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. 
green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..30658bf7b7c6b5dab06fdd3c822a017d302eefa3 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. 
+16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jack think Jackson thinks Jacob thinks the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..103dfe8271623a1640b151c3ab4ac140a75cb6d7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. 
+30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Ella think Jack thinks Jackson thinks Jacob thinks the spinach is? +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8acce8b74403e2a25c4f652a77c732b682385ab6 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where is the corn really? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. 
green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..54c6807e9a257815effb160596acdb51c38725d9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. 
+17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Amelia really think the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..dae76cbff515364e8e3faa306df48cffa940760c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. 
+30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Nathan think Amelia thinks the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b055be880458042697458060ace1ee9a4b1e354c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. 
+2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Lily think Nathan thinks Amelia thinks the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. 
red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fb84f0c20564c9c6c4e1acb0a7330ce2926300f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. 
+18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Alexander think Lily thinks Nathan thinks Amelia thinks the corn is? +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..87796ce42dba4b88251638407a7f2995a752f47b --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. 
+29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where is the sweet_potato really? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6101885284f6076b8860312029eab51370c31821 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Sophia really think the sweet_potato is? 
+Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e52fcdcae797393df33d453b6e580eb3ab1203f --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. 
+15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Jackson think Sophia thinks the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..829de35b917a8d927599f80c4d74815feae0b536 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. 
+27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Avery think Jackson thinks Sophia thinks the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8ea1fe9816466517262a19794ab363c35909bce --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. 
+33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Hannah think Avery thinks Jackson thinks Sophia thinks the sweet_potato is? +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..598d72a7dbcdf69ad6e9648eb5720b0e1e53c1bc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. 
+3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where is the orange really? 
+Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c87d7ee94ffdc9cb54f12fbc9f99390c2d9e2a7e --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. 
+15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Owen really think the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..916fe3e015f96d87f6c92804bebbfe7547536e6c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. 
+22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Isabella think Owen thinks the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3c9f73eb76fa45b2bd69616396c6b2705d04ff5 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. 
+32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Jacob think Isabella thinks Owen thinks the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc7964883a0e24eb8ac68efa398075596c25695 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. 
+43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Hannah think Jacob thinks Isabella thinks Owen thinks the orange is? +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..96c47d463fc98d32f1106f04a95892c473f242f1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. 
+12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where is the lime really? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecfc656ae6d4e1ce6f55a98dbd540ef124e7c3e9 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. 
+28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Amelia really think the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..784dbbff31629d42a2884b66a909950c3638cd82 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. 
+35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Sophia think Amelia thinks the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e157f9b20e6635232caa28aa61ba8b893928bd1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. 
+6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Chloe think Sophia thinks Amelia thinks the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..234485dc0e0cc2aa897cf1fc9be7d9c5999726a1 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. 
+20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Isabella think Chloe thinks Sophia thinks Amelia thinks the lime is? +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2b140ca572c03d0e50d88cced677554d83f9acc --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. 
+35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where is the carrot really? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4ee0a6871df28f0cde0d57e5c3f2d97ea4417fd7 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. 
+4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Chloe really think the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. 
blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e3a912180b88ea0a9e9111ff05eb82097ad50bf --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. 
+19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Amelia think Chloe thinks the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdf58058158a500baddaa14f97d8470bee6c391c --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. 
+30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Avery think Amelia thinks Chloe thinks the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..02ece7785bcf5191782d121debc997251b34e79a --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. 
+35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Sophia think Avery thinks Amelia thinks Chloe thinks the carrot is? +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a7e0c822146488347e2bf984c6208eed70b03e20 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. 
+2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where is the watermelon really? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. 
green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..45d1a1c0420b7696cfc5b8179a03287365e46071 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. 
+16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Isla really think the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..302be446002081c9d2fc650047f020599c42bc94 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. 
+29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Carter think Isla thinks the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..217e2864155e3230bada5c88f3eb479a27b32b48 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. 
+Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Elizabeth think Carter thinks Isla thinks the watermelon is? +Choices: A. 
blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2e741eb5eac4337e7320b9fca57a9a933b4efb0 --- /dev/null +++ b/ToMh_dataset/Hi-ToM_prompts/Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Please provide answer without explanations. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. 
+14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Nathan think Elizabeth thinks Carter thinks Isla thinks the watermelon is? +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. diff --git a/ToMh_dataset/README.md b/ToMh_dataset/README.md new file mode 100644 index 0000000000000000000000000000000000000000..dfe672010f7fec3e6cf1343493c9194781eb2539 --- /dev/null +++ b/ToMh_dataset/README.md @@ -0,0 +1,25 @@ +# Hi-ToM Dataset + +This is the dataset for the paper "Hi-ToM: A Benchmark for Evaluating Higher-Order Theory of Mind Reasoning in Large Language Models". + + + +### The `Hi-ToM_data` folder + +Contains ToMh data consisting of story-question pairs and the corresponding answers. +The subfolder names have the following meanings: + +- `Tell` / `No_Tell`: whether or not the stories contain communications among agents. +- `MC` / `CoT`: the prompting style. `MC` corresponds to Vanilla Prompting (VP) in the paper, while `CoT` stands for Chain-of-Thought Prompting (CoTP). +- `length_n`: the story length, i.e. the number of chapters in a story; `n` ranges from 1 to 3. +- `sample_n`: the index of the sample story. +- `order_n`: the ToM order of the question; `n` ranges from 0 to 4. + +### The `Hi-ToM_prompts` folder + +Contains prompt files that can be fed directly to an LLM API. +The data in it are almost the same as in `Hi-ToM_data`, except that the answers are removed. + +### Generate new data and prompts + +Run the script `generate_tomh.sh`.
# --- diff residue preserved verbatim from the collapsed source line ---
# diff --git a/ToMh_dataset/__pycache__/stringify.cpython-38.pyc b/ToMh_dataset/__pycache__/stringify.cpython-38.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2c1de56826c1e0650927fbe7011d39a60569e9c7 Binary files /dev/null and b/ToMh_dataset/__pycache__/stringify.cpython-38.pyc differ
# diff --git a/ToMh_dataset/actions.py b/ToMh_dataset/actions.py new file mode 100644 index 0000000000000000000000000000000000000000..1cdde554eff138cbf155c05a48ab2e5bf30f6826 --- /dev/null +++ b/ToMh_dataset/actions.py @@ -0,0 +1,270 @@
"""Sentence templates for story statements and questions.

Each ``Action`` subclass carries a dict of printf-style templates keyed by
grammatical mood (``'declarative'`` and/or ``'interrogative'``).  Rendering
picks one template at random and fills its ``%s`` slots positionally.
Interrogative templates end in ``\\t%s``: the final argument is appended
after a tab.
"""
import numpy as np


class Action(object):
    """Base class: holds a template dict and renders a random template."""

    def __init__(self, templates):
        """Store ``templates``, a dict mapping a mood name to a list of
        printf-style format strings."""
        self.templates = templates

    def _render(self, mood, args):
        """Pick one ``mood`` template at random and fill it with ``args``.

        Raises:
            AssertionError: if this action has no (or an empty) template
                list for ``mood``.
        """
        assert mood in self.templates and \
            len(self.templates[mood]) > 0, str(self.templates)
        # Exactly one np.random.choice call per render, as before, so seeded
        # runs consume the global NumPy RNG identically.
        return np.random.choice(self.templates[mood]) % args

    def render_declarative(self, *args):
        """Return a randomly chosen declarative sentence filled with ``args``."""
        return self._render('declarative', args)

    def render_interrogative(self, *args):
        """Return a randomly chosen question filled with ``args``."""
        return self._render('interrogative', args)


class ExistBeginning(Action):
    """Question about where an object was initially."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where was the %s at the beginning?\t%s',
                'Where was the %s before?\t%s',
            ]
        })


class Exist(Action):
    """Question about where an object currently is."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where is the %s?\t%s',
                'Where is the %s located?\t%s',
            ]
        })


class PlaceAction(Action):
    """Agent places an object in a container (statement and question)."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s placed the %s in the %s.',
                '%s put the %s in the %s.',
            ],
            'interrogative': [
                'Where did %s place the %s?\t%s',
                'Where did %s put the %s?\t%s',
            ]
        })


class SearchAction(Action):
    """Agent searches for an object in a container (statement and question)."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s searched for the %s in the %s.',
                '%s looked for the %s in the %s.',
            ],
            'interrogative': [
                'Where did %s search for the %s?\t%s',
                'Where did %s look for the %s?\t%s',
            ],
        })


class TransportAction(Action):
    """Agent shifts an object from one container to another."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s shifted the %s from the %s to the %s.',
            ],
        })


# NOTE: an earlier, two-template ``EnterAction`` used to be defined at this
# point.  It was unconditionally shadowed by the single-template
# ``EnterAction`` at the bottom of this module (same name, later binding), so
# it was dead code and has been removed; the name still resolves to the same
# class as before.


class ExitAction(Action):
    """Agent leaves a location (randomised wording)."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s exited the %s.',
                '%s left the %s.',
                '%s went out of the %s.',
            ],
        })


class BelieveLocationAction(Action):
    """First-order belief about an object's location."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s thinks the %s is in the %s.',
                '%s believes the %s is in the %s.',
            ],
            'interrogative': [
                'Where does %s think the %s is?\t%s',
                'Where does %s believe the %s is?\t%s',
            ],
        })


class BelieveAgentBelieveLocationAction(Action):
    """Second-order belief question (agent about agent about object)."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where does %s think that %s believes the %s is?\t%s',
                'Where does %s believe that %s believes the %s is?\t%s',
                'Where does %s think that %s thinks the %s is?\t%s',
                'Where does %s believe that %s thinks the %s is?\t%s',
            ],
        })


class BelieveAgentSearchLocationAction(Action):
    """Second-order question about where another agent searches."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where does %s think that %s looks for the %s?\t%s',
                'Where does %s believe that %s looks for the %s?\t%s',
                'Where does %s think that %s searches for the %s?\t%s',
                # Was "... %s search for ..." (subject-verb disagreement);
                # now matches the three sibling templates.
                'Where does %s believe that %s searches for the %s?\t%s',
            ],
        })


class InformLocationAction(Action):
    """Agent tells another agent where an object is."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s told %s that the %s is in the %s.',
                '%s informed %s that the %s is in the %s.',
            ],
        })


####################################################
#######  Deterministic Actions for New Task  #######
####################################################
# Every class below has exactly one template per mood, so its wording is
# always the same.

class FirstQ(Action):
    """Question: where an agent will look for an object."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where will %s look for the %s?\t%s',
            ]
        })


class SecondQ(Action):
    """Question: where one agent thinks another searches for an object."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where does %s think that %s searches for the %s?\t%s',
            ]
        })


class ZeroQ(Action):
    """Question: where the object really is."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where is the %s really?\t%s',
            ]
        })


class MemoryAction(Action):
    """Question: where the object was at the beginning."""

    def __init__(self):
        super().__init__({
            'interrogative': [
                'Where was the %s at the beginning?\t%s',
            ]
        })


class LocationAction(Action):
    """Statement: two agents are in a location."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s and %s are in the %s.',
            ]
        })


class ObjectLocAction(Action):
    """Statement: an object is in a container."""

    def __init__(self):
        super().__init__({
            'declarative': [
                'The %s is in the %s.',
            ]
        })


class ExitedAction(Action):
    """Statement: an agent exited a location (fixed wording)."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s exited the %s.',
            ]
        })


class MoveAction(Action):
    """Statement: an agent moved an object to a container."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s moved the %s to the %s.',
            ]
        })


class TellAction(Action):
    """Statement: an agent told another agent where an object is."""

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s told %s where the %s is.',
            ]
        })


class EnterAction(Action):
    """Statement: an agent entered a location (fixed wording).

    This is the only ``EnterAction`` in the module; see the note above
    ``ExitAction`` about the removed, shadowed variant.
    """

    def __init__(self):
        super().__init__({
            'declarative': [
                '%s entered the %s.',
            ]
        })

# --- diff residue preserved verbatim from the collapsed source line ---
# \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo.zip b/ToMh_dataset/check_GPT-3.5-turbo.zip new file mode 100644 index
0000000000000000000000000000000000000000..83e00ed840d2a70b896c81934ade86d27e4596b0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c33dc03cf7eb9ffba42469bcecb08707031bfea82430ac0f4f66d1642ae602fc +size 1534526 diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2456458ead1ba30461759716b80bd690ce9ec13 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where is the lettuce really? +Answer: green_drawer +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to follow the movements of the agents and determine where the lettuce ended up. Avery initially moved the lettuce to the green bathtub, then Charlotte moved it to the blue pantry, and finally, Owen moved it back to the green drawer. Therefore, the lettuce is really in the green drawer. The answer is K. green_drawer. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df981d8e5e8e98b543fd51f1743bc05bcb8d456b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. 
+11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Avery really think the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track Avery's movements and any interactions she had with other agents regarding the lettuce. According to the story, Avery initially moved the lettuce to the green_bathtub, but later exited the living_room. There is no mention of Avery having any private or public interactions with other agents regarding the lettuce. Therefore, we can assume that Avery's actual thought about the lettuce's location is where she last placed it, which is the green_bathtub. Therefore, the correct answer is O. green_bathtub. 
+ +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2615ff5633a2ca35e3910ab8df8cda93044e6cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Charlotte think Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of Avery and the lettuce. Avery initially moved the lettuce to the green bathtub, but later exited the living room. Charlotte then moved the lettuce to the blue pantry. We don't know if Charlotte had any private or public interactions with Avery after he left the living room, so we can't be sure what she thinks about where Avery thinks the lettuce is. However, we do know that Charlotte exited the living room after Avery did, so she may be more likely to trust his judgment. Therefore, the answer is likely either green_bathtub or blue_pantry. Since Charlotte moved the lettuce to the blue pantry, it's possible that she thinks Avery also believes the lettuce is in the blue pantry. Therefore, the answer is L. blue_pantry. + +a: 5 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..34b797f60cd7a30fb9f04f2ce74797969a9ecb99 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. 
+7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Owen think Charlotte thinks Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of Avery, Charlotte, and Owen regarding the lettuce. Avery initially moved the lettuce to the green bathtub, then exited the living room. Charlotte then moved the lettuce to the blue pantry before exiting the living room. Finally, Owen moved the lettuce back to the green drawer before exiting the living room. 
+ +Based on the assumption that agents tend to trust those who exit the room later than themselves, we can assume that Owen trusts Charlotte's movements more than Avery's. Therefore, Owen likely thinks that Charlotte thinks the lettuce is in the blue pantry, where she last moved it before exiting the living room. + +However, we also need to consider the fact that agents tend to lie and that we cannot directly infer another agent's thoughts unless they have had private or public interactions. Therefore, we cannot be certain of Owen's actual thoughts on where Charlotte thinks Avery thinks the lettuce is. + +Based on the given options, the answer would be L. blue_pantry. + +a: 5 9 6 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5b1b564bc10ffef7701169a3ae704eea37114af --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. 
+16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Isabella think Owen thinks Charlotte thinks Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_bathtub +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their likes/dislikes. Isabella made no movements and stayed in the living room for 1 minute, so she witnessed all the movements of other agents. Owen likes the green envelope and dislikes the green pepper. Avery moved the lettuce to the green bathtub, then exited the living room. Charlotte moved the lettuce to the blue pantry, then exited the living room. Elizabeth dislikes the tangerine and made no movements for 1 minute before exiting the living room. Owen moved the lettuce to the green drawer, then exited the living room with all other agents. + +Now, we need to use the assumptions to infer what Isabella thinks Owen thinks Charlotte thinks Avery thinks about the lettuce's location. Isabella and Owen were in the living room together, so Isabella can infer Owen's thoughts. 
Owen exited the living room after Avery, so Isabella can trust Owen's claims more than Avery's. Charlotte moved the lettuce after Avery, so Isabella can trust Charlotte's claims more than Avery's. Therefore, Isabella thinks Owen thinks Charlotte thinks the lettuce is in the blue pantry, which is where Charlotte moved it. + +The answer is L. blue_pantry. + +a: 5 9 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aadfb2cba6be25eb086b06d8485b1eeed8c926bd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where is the plum really? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with the plum. From the story, we know that the plum was initially in the red_pantry, but Evelyn moved it to the green_bucket. Jacob later moved the plum back to the red_pantry before all the agents exited to the waiting_room. Therefore, the plum is really in the red_pantry. The answer is G. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d7229e35c3b3ca7ffa3d5b08e3f34350e78a78b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. 
+11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does William really think the plum is? +Answer: green_bucket +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to analyze the movements and actions of each character in the story and their possible interactions with each other. We know that the plum was initially in the red_pantry, but Evelyn moved it to the green_bucket. Nathan saw a mouse and Evelyn saw a monkey, but we don't know if they interacted with each other or with any other character. William made no movements and stayed in the pantry for 1 minute, but we don't know if he saw the plum or if he interacted with any other character who saw the plum. Emily disliked the plum and made no movements before exiting the pantry. Jacob moved the plum back to the red_pantry before exiting the pantry with the other characters. 
+ +Based on these assumptions, we can infer that William may have seen the plum in the red_pantry before Jacob moved it back. However, we cannot be certain of this as William made no movements and we don't know if he interacted with any other character who saw the plum. Therefore, the answer to the question is A. red_drawer, as this is the only option that corresponds to the red_pantry where the plum was initially located. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c7b9d58db9f40f980ac31d2178b26edecd2d6ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Nathan think William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. 
red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of Nathan and William and the location of the plum. Nathan and William both entered the pantry and stayed there for 1 minute each. Evelyn moved the plum from the red_pantry to the green_bucket before exiting the pantry. Jacob moved the plum back to the red_pantry before exiting the pantry. Emily also entered the pantry but made no movements before exiting. Nathan saw a mouse and made no movements before exiting the pantry. Based on the assumption that agents tend to trust those who exit the room later than themselves, Nathan would trust William's thoughts more than Emily's or Jacob's. + +Since William did not make any movements in the pantry, we cannot determine his thoughts based on his actions. However, we can infer his thoughts based on the actions of others and the location of the plum. Since Evelyn moved the plum to the green_bucket before exiting the pantry, William may think that the plum is in the green_bucket. However, Jacob moved the plum back to the red_pantry before exiting the pantry, so William may also think that the plum is in the red_pantry. + +Therefore, Nathan may think that William thinks the plum is either in the green_bucket or the red_pantry. 
The answer choices are locations, so the possible answers are G (red_pantry) or I (green_bucket). + +The answer is either G or I, depending on what William thinks. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..24da83a6786c5376ad181160ab34d8569a37cab7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Evelyn think Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Evelyn think Nathan thinks William thinks the plum is? + +2. We know that Nathan saw a mouse and Evelyn saw a monkey, but this information is not relevant to the question. + +3. We need to focus on the movements of the plum and the agents in the story. + +4. According to the story, the plum was initially in the red_pantry, but Evelyn moved it to the green_bucket. + +5. Nathan made no movements in the pantry, so we don't know where he thinks the plum is. + +6. William also made no movements in the pantry, so we don't know where he thinks the plum is. + +7. Emily dislikes the plum and made no movements in the pantry, so we don't know where she thinks the plum is. + +8. Jacob moved the plum back to the red_pantry before exiting the pantry. + +9. Evelyn exited the pantry after moving the plum to the green_bucket. + +10. Nathan exited the pantry before Evelyn. + +11. William exited the pantry after Evelyn. + +12. Emily exited the pantry before William. + +13. Based on the assumptions, we know that agents tend to trust agents who exited the room later than themselves. + +14. Therefore, Evelyn is more likely to trust William's opinion on the location of the plum than Nathan's opinion. + +15. However, we still don't know where William thinks the plum is. + +16. 
We can infer that Evelyn thinks William thinks the plum is in the green_bucket, since that is where she moved it to and she exited the pantry before William. + +17. Therefore, the answer is I. green_bucket. + +To summarize, the question requires careful analysis of the story and assumptions, as well as logical reasoning to infer the answer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cc703536a1a467f1cf727c904bfd0e13cf3522c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? + +2. We need to start with Jacob's perspective. According to the story, Jacob moved the plum to the red_pantry before leaving the pantry. So, Jacob thinks the plum is in the red_pantry. + +3. Now we need to consider what Evelyn thinks. According to the story, Evelyn saw the plum in the red_pantry, but then moved it to the green_bucket before leaving the pantry. So, Evelyn knows that the plum was in the red_pantry, but she may or may not think it's still there. + +4. Next, we need to consider what Nathan thinks. According to the story, Nathan made no movements in the pantry, but he saw a mouse. There is no information about what Nathan thinks about the plum. + +5. Now we need to consider what William thinks. According to the story, William made no movements in the pantry, and there is no information about what he thinks about the plum. + +6. Based on the assumptions, we know that Jacob can only infer what Nathan thinks if they had a private or public interaction. There is no information about any such interaction, so we cannot determine what Nathan thinks about the plum. + +7. Similarly, Jacob can only infer what William thinks if they had a private or public interaction. 
There is no information about any such interaction, so we cannot determine what William thinks about the plum. + +8. Therefore, we cannot determine where Jacob thinks Evelyn thinks Nathan thinks William thinks the plum is. + +9. The answer is none of the above (not listed). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b4ac3ade1fc4bbc3b94cac683e6f6c47f4d317e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where is the orange really? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their actions related to the orange. According to the story, the orange was initially in the red_box. Benjamin moved the orange to the red_envelope before he exited the study. Then, Elizabeth moved the orange back to the red_box before she exited the study. Therefore, the orange is really in the red_box. The answer is F. red_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cffcff1e0edbaa85077468e2a9f420a2a21afc8c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. 
+12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Ella really think the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the orange and the agents. According to the story, the orange was initially in the red_box (step 2). Then, Benjamin moved the orange to the red_envelope (step 6), and finally, Elizabeth moved the orange back to the red_box (step 13). + +Ella made no movements in the study and stayed there for one minute (step 10), so she did not physically interact with the orange. However, we can infer her thoughts based on the actions of the other agents. + +Chloe did not move the orange (step 3) and left the study before Benjamin moved the orange (step 5), so she does not know where the orange is. Alexander also did not move the orange (step 8) and left the study before Elizabeth moved the orange back to the red_box (step 9), so he also does not know where the orange is. 
+ +Benjamin moved the orange to the red_envelope (step 6) and saw a cat (step 11) before leaving the study. Elizabeth moved the orange back to the red_box (step 13) before leaving the study. + +Since Ella did not physically interact with the orange, we can assume that her thoughts about the orange's location are based on the actions of Benjamin and Elizabeth. Benjamin moved the orange to the red_envelope, but he left the study before Elizabeth moved the orange back to the red_box. Therefore, Ella would think that the orange is still in the red_envelope. + +The answer is H. red_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..46c37746bfcb89d5dc295aa812d44b7c036131e9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Elizabeth think Ella thinks the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. 
blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the location of the orange. From the story, we know that Chloe, Benjamin, Alexander, Ella, and Elizabeth entered the study. The orange was initially in the red_box. Chloe made no movements and stayed in the study for 1 minute before exiting. Alexander lost his phone and stayed in the study for 1 minute before exiting. Benjamin moved the orange to the red_envelope before exiting. Ella made no movements and stayed in the study for 1 minute before exiting. Elizabeth moved the orange back to the red_box before exiting. + +Therefore, Elizabeth knows that the orange is in the red_box when she exits the study. However, we need to determine where Elizabeth thinks Ella thinks the orange is. We know that Benjamin saw a cat and Ella made no movements before exiting the study. Therefore, Elizabeth has no reason to believe that Ella knows the orange was moved to the red_envelope by Benjamin. + +Based on the given options, the only logical answer is F. red_box, as that is where Elizabeth knows the orange is and she has no reason to believe that Ella knows otherwise. 
Therefore, Elizabeth would think that Ella thinks the orange is in the red_box. + +The answer is F. red_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c756874e56788d9a32c7076ce10f3700ba9d3fed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Chloe think Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Chloe, Benjamin, Alexander, Ella, and Elizabeth entered the study. +2. The orange is in the red_box. +3. Chloe made no movements and stayed in the study for 1 minute. +4. Alexander lost his phone. +5. Chloe exited the study. +6. Benjamin moved the orange to the red_envelope. +7. Benjamin exited the study. +8. Alexander made no movements and stayed in the study for 1 minute. +9. Alexander exited the study. +10. Ella made no movements and stayed in the study for 1 minute. +11. Benjamin saw a cat. +12. Ella exited the study. +13. Elizabeth moved the orange to the red_box. +14. Elizabeth exited the study. +15. Chloe, Benjamin, Alexander, Ella, and Elizabeth entered the waiting_room. + +Based on the story and assumptions, we know that Chloe can only infer Elizabeth's thoughts if they were in the same place or had private or public interactions. We also know that Chloe tends to lie, so we cannot trust what she says. + +We need to determine where Elizabeth thinks Ella thinks the orange is. We know that Elizabeth moved the orange to the red_box, but we don't know what she thinks about where Ella thinks the orange is. + +We need to look for clues in the story. Ella made no movements and stayed in the study for 1 minute, so she didn't move the orange. Benjamin moved the orange to the red_envelope, but we don't know what he thinks about where Ella thinks the orange is. Alexander made no movements and stayed in the study for 1 minute, so he didn't move the orange either. 
+ +The only clue we have is that Benjamin saw a cat, but this doesn't help us determine where Elizabeth thinks Ella thinks the orange is. + +Therefore, we cannot answer this question based on the information given in the story and assumptions. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee2d1cf7613d615c0910c6a128d34b614b85cfbe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Alexander think Chloe thinks Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. To start, we need to identify the order of events and the movements of each character: + +1. Chloe, Benjamin, Alexander, Ella, and Elizabeth enter the study. +2. The orange is in the red_box. +3. Chloe stays in the study for 1 minute and makes no movements. +4. Alexander loses his phone. +5. Chloe exits the study. +6. Benjamin moves the orange to the red_envelope. +7. Benjamin exits the study. +8. Alexander stays in the study for 1 minute and makes no movements. +9. Alexander exits the study. +10. Ella stays in the study for 1 minute and makes no movements. +11. Benjamin sees a cat. +12. Ella exits the study. +13. Elizabeth moves the orange to the red_box. +14. Elizabeth exits the study. +15. Chloe, Benjamin, Alexander, Ella, and Elizabeth enter the waiting_room. + +Based on these events, we can make some inferences about what each character knows and thinks: + +- Chloe knows that the orange was in the red_box when she entered the study, but she doesn't know that Benjamin moved it to the red_envelope. +- Alexander doesn't know where the orange is, but he knows that Chloe was in the study before him and that she didn't move the orange. +- Ella doesn't know where the orange is, but she knows that Chloe and Alexander were in the study before her and that they didn't move the orange. 
+- Elizabeth knows that the orange was in the red_box when she entered the study, but she doesn't know that Benjamin moved it to the red_envelope. + +Now we can try to answer the question. We need to work backwards from Elizabeth to Chloe, making sure to take into account what each character knows and what they might think based on that knowledge. + +- Elizabeth knows that she moved the orange to the red_box, so she thinks the orange is in the red_box. +- Ella doesn't know where the orange is, but she knows that Elizabeth moved it to the red_box, so she might think the orange is in the red_box. +- Alexander doesn't know where the orange is, but he knows that Ella was in the study after Chloe and that she might think the orange is in the red_box, so he might think that Chloe thinks Ella thinks the orange is in the red_box. +- Chloe knows that the orange was in the red_box when she entered the study, but she doesn't know that Benjamin moved it to the red_envelope. She also knows that Alexander was in the study after her and that he might think she thinks the orange is in the red_box. However, she might also suspect that Benjamin moved the orange, so she might think that Elizabeth thinks the orange is in the red_box (since she moved it there) or that Ella thinks the orange is in the red_envelope (since she didn't see Benjamin move it). + +Based on this analysis, the answer is either A. red_bottle (if Chloe thinks Elizabeth thinks the orange is in the red_box) or H. red_envelope (if Chloe thinks Ella thinks the orange is in the red_envelope). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f97007f7082e4911c5a3a08415d3b5e480b2e2a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where is the melon really? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their actions in the garden. Mila did not move and left the garden without doing anything. Ava moved the melon to the green_basket. Liam did not move and left the garden without doing anything. Ella moved the melon to the red_bottle. William did not move and left the garden without doing anything. Therefore, the melon is in either the green_basket or the red_bottle. The correct answer is either F or I. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfc34da101aeb98648b0750572ef9a230df2448d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does William really think the melon is? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. 
green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with the melon. Mila did not move the melon and left the garden before any other agent moved the melon. Ava moved the melon to the green_basket before leaving the garden. Liam did not move the melon and left the garden after Ava. Ella moved the melon to the red_bottle before leaving the garden. William did not move the melon and left the garden after Ella. + +Since William did not move the melon, he must rely on the information he received from the other agents. Ava moved the melon to the green_basket before leaving the garden, and Ella moved the melon to the red_bottle before leaving the garden. Since William trusts agents who exited the garden after him, he would trust Ella's claim that the melon is in the red_bottle. Therefore, William really thinks the melon is in the red_bottle (option I). + +The correct answer is I. red_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2840323e5f63af23f5ffe7e39f2a8c0963e80ae6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Mila think William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To answer this question, we need to track the movements of Mila and William and their interactions with the melon. Mila entered the garden with William and the others, but made no movements and stayed for only one minute before exiting. William also made no movements and stayed for one minute before exiting. Therefore, Mila and William did not interact with each other or the melon while in the garden. + +Next, we need to look at the movements of the other agents. Ava moved the melon to the green_basket, and Ella moved the melon to the red_bottle. Liam made no movements and stayed in the garden for one minute, but saw a mouse. + +Since Mila did not interact with the melon and William made no movements, we cannot determine where William thinks the melon is based on their actions alone. However, we can make some inferences based on the actions of the other agents. + +Ava moved the melon to the green_basket, but we do not know if William saw this happen or if he was in the garden at the time. Ella moved the melon to the red_bottle, but we do not know if William saw this happen or if he was still in the garden at the time. Liam saw a mouse, but we do not know if he saw the melon or where he thinks it is. + +Therefore, we cannot determine where Mila thinks William thinks the melon is based on the given information. The answer is unknown. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..397abc5bf51cfd3511f1fa1b330c1badba1f26ef --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ella think Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Ella think Mila thinks William thinks the melon is? + +2. To answer this question, we need to first determine where each agent was when they interacted with the melon. + +3. Mila made no movements and stayed in the garden for 1 minute, so she did not interact with the melon. + +4. Ava moved the melon to the green_basket before exiting the garden. + +5. Liam made no movements and stayed in the garden for 1 minute, so he did not interact with the melon. + +6. Ella moved the melon to the red_bottle before exiting the garden. + +7. William made no movements and stayed in the garden for 1 minute, so he did not interact with the melon. + +8. Based on the assumptions, we know that Ella can only infer William's thoughts if they were in the same place or had private or public interactions. + +9. Since Ella moved the melon after Ava, she would trust Ava's exit order more than William's. + +10. Therefore, Ella would think that Mila thinks the melon is in the green_basket, since that is where Ava moved it and Ella would trust Ava's actions more than William's. + +11. The answer is F. green_basket. + +So, Ella thinks that Mila thinks William thinks the melon is in the green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f71b8263bc11b2847194bcc26e02bf64b559646e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ava think Ella thinks Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. We need to trace the movements of each agent and their interactions with each other to determine where Ava thinks Ella thinks Mila thinks William thinks the melon is. + +First, we know that Mila made no movements in the garden and then exited. 
Therefore, she did not move the melon. + +Next, Ava moved the melon to the green_basket before exiting the garden. + +Liam made no movements in the garden and then exited. + +Ella moved the melon to the red_bottle before exiting the garden. + +William made no movements in the garden and then exited. + +Based on these movements, we can deduce that the melon was last seen in the red_bottle by Ella. However, we need to determine where Ava thinks Ella thinks Mila thinks William thinks the melon is. + +Since Ava moved the melon to the green_basket, she knows that it is not in the red_bottle. Liam made no movements in the garden, so he cannot provide any information about the melon's location. Ella moved the melon to the red_bottle, so she knows that it is not in the green_basket. William made no movements in the garden, so he cannot provide any information about the melon's location. + +Therefore, Ava thinks that Ella thinks that Mila thinks that William thinks the melon is in the green_basket. + +The answer is F. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5bacc24862c99b4470000fafe64ab03dbe85b2d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. 
+9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of the cabbage and which agent moved it to which location. According to the story, Amelia moved the cabbage from the red_container to the green_envelope, and then Abigail moved it from the green_envelope to the green_crate. Finally, Charlotte moved it from the green_crate to the blue_crate. Therefore, the cabbage is really in the blue_crate, which is option F. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ece961b2521bb1dbe78a5516621a88ccce70e328 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Abigail really think the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to consider the movements of each agent and their potential interactions with each other. According to the story, Amelia moved the cabbage from the red_container to the green_envelope, and Abigail then moved it from the green_envelope to the green_crate. Charlotte then moved it from the green_crate to the blue_crate. Carter and Nathan made no movements and simply stayed in the laundry for one minute before exiting. + +Based on the assumptions given, we know that Abigail may have interacted with Amelia and Charlotte, but not with Carter or Nathan. We also know that agents tend to lie, so we cannot trust what Abigail may have told the others about the cabbage's location. + +However, we do know that Abigail exited the laundry before Charlotte, and therefore may be more likely to trust Charlotte's movements. Since Charlotte moved the cabbage to the blue_crate, it is possible that Abigail believes the cabbage is in the blue_crate. + +Therefore, the answer to the question is F. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..50b23a74cd7a143fff2d9e0e572dfec9474341a4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. 
+5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to track the movements of the cabbage and the agents. Amelia moved the cabbage from the red_container to the green_envelope, and Abigail moved it from the green_envelope to the green_crate. Charlotte then moved it from the green_crate to the blue_crate. Carter and Nathan made no movements and stayed in the laundry for 1 minute before exiting. + +Since Nathan exited the laundry after Abigail, he would tend to trust her more than Amelia or Charlotte. 
However, we don't know if Abigail made any claims about the location of the cabbage before she exited. Therefore, we cannot infer where Nathan thinks Abigail thinks the cabbage is. + +The answer is: Cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..10886ba01081726a69c171efe42696fbde164c7e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +Answer: green_envelope +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. Let's break it down step by step: + +1. Where does Nathan think the cabbage is? +- We don't have any information about Nathan moving the cabbage or expressing his thoughts about it, so we can't determine where he thinks it is. + +2. Where does Abigail think the cabbage is? +- Abigail moved the cabbage to the green crate, so she definitely thinks it's in the green crate. + +3. Where does Amelia think Abigail thinks the cabbage is? +- Amelia moved the cabbage from the red container to the green envelope, so she knows it's not in the red container anymore. +- Amelia left the laundry before Abigail, so she trusts Abigail less than anyone who exited after her. +- We don't have any information about Amelia and Abigail having any private or public interactions, so we can't determine if Amelia has any reason to doubt Abigail's actions or statements. +- Therefore, Amelia most likely thinks that Abigail still thinks the cabbage is in the green crate, since that's where Abigail left it and Amelia has no reason to doubt her. + +4. Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +- We don't have any information about Nathan's thoughts, but we know that Amelia trusts him less than anyone who exited after her. 
+- Since Abigail left the cabbage in the green crate and Amelia has no reason to doubt her, it's reasonable to assume that Nathan also thinks the cabbage is in the green crate, since he would trust Abigail's actions and statements more than Amelia's. + +Therefore, the answer is H. green_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b2c9439db20d8279825c1d8347cfe0173d089c7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Charlotte think Amelia thinks Nathan thinks Abigail thinks the cabbage is? +Answer: green_envelope +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. Charlotte moved the cabbage to the blue_crate. +2. Charlotte exited the laundry. +3. Nathan made no movements and stayed in the laundry for 1 minute. +4. Nathan exited the laundry. +5. Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. + +Based on the assumptions given, we know that Charlotte can only infer what Amelia thinks if they were in the same place or had private/public interactions. We also know that agents tend to lie, so we can't trust what they say. + +We don't have any information about Amelia's thoughts on the cabbage, but we do know that Abigail moved the cabbage to the green_crate after Amelia moved it to the green_envelope. This means that Abigail thinks the cabbage is in the green_crate, but we can't trust that this is actually true. + +Since Nathan and Carter made no movements in the laundry, we don't have any information about their thoughts on the cabbage. + +When Charlotte moved the cabbage to the blue_crate, she could have thought that the cabbage was in any of the previous locations (red_container, green_envelope, or green_crate) or she could have thought that it was in a completely different location. We don't have any information to suggest where she thought the cabbage was. + +Therefore, we can't determine where Charlotte thinks Amelia thinks Nathan thinks Abigail thinks the cabbage is. The answer is inconclusive. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9530594820936937be6c542ff7de1f9f9bd4c252 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where is the lime really? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the lime and the agents. Emily moved the lime from the green_envelope to the blue_pantry, and then Jack moved it from the blue_pantry to the blue_suitcase. Abigail then moved the lime from the blue_suitcase to the green_envelope. Therefore, the lime is really in the green_envelope. The answer is K. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fc3ee0a6ba84067cf907f8eef997fb6def63db3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail really think the lime is? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. 
green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to trace the movements of the lime and the agents. Emily moved the lime from the green_envelope to the blue_pantry, and Jack moved it from there to the blue_suitcase. Abigail then moved the lime back to the green_envelope before all agents exited the playroom. We know that Emily likes the green_crate and Avery likes the red_basket, but we don't have any information about the preferences of Jack, Aiden, or Abigail. Therefore, we cannot infer Abigail's thoughts based on her preferences. However, we do know that Abigail moved the lime to the green_envelope before leaving the playroom. Therefore, the answer is K. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0007e34929f15a7bdd19b20fdd56f20d0bfff1b1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Avery think Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of the lime and the agents and their thoughts. + +1. Emily, Jack, Avery, Aiden, and Abigail entered the playroom. +2. The lime is in the green_envelope. +3. Emily moved the lime to the blue_pantry. +4. 
Emily exited the playroom. +5. Jack moved the lime to the blue_suitcase. +6. Jack exited the playroom. +7. Avery made no movements and stayed in the playroom for 1 minute. +8. Avery exited the playroom. +9. Emily likes the green_crate. +10. Aiden made no movements and stayed in the playroom for 1 minute. +11. Aiden exited the playroom. +12. Avery likes the red_basket. +13. Abigail moved the lime to the green_envelope. +14. Abigail exited the playroom. +15. Emily, Jack, Avery, Aiden, and Abigail entered the waiting_room. + +Based on the assumptions, we know that Avery can only infer Abigail's thought if they have been in the same place or have had private or public interactions. We also know that agents tend to lie, so what they tell others doesn't necessarily reflect their actual thoughts. + +We don't have any information about Avery and Abigail being in the same place or having private interactions, so we need to look for any public interactions or movements that might give us a clue. + +The lime starts in the green_envelope and is moved by Emily to the blue_pantry, then by Jack to the blue_suitcase, and finally by Abigail back to the green_envelope. Avery makes no movements and stays in the playroom for 1 minute. + +We know that Emily likes the green_crate and Avery likes the red_basket, but we don't have any information about Abigail's preferences. + +Based on the movements of the lime and the fact that Avery makes no movements, it's possible that Avery didn't see Abigail move the lime back to the green_envelope. Therefore, Avery might still think that the lime is in the blue_suitcase, which is the last place he saw it. + +Therefore, the answer is (M) blue_suitcase. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..164b62c7ae21186428bd35e2f3bd4ebf3376e799 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Jack think Avery thinks Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their thoughts. + +1. Emily, Jack, Avery, Aiden, and Abigail entered the playroom. +2. The lime is in the green_envelope. +3. Emily moved the lime to the blue_pantry. +4. Emily exited the playroom. +5. Jack moved the lime to the blue_suitcase. +6. Jack exited the playroom. +7. Avery made no movements and stayed in the playroom for 1 minute. +8. Avery exited the playroom. +9. Emily likes the green_crate. +10. Aiden made no movements and stayed in the playroom for 1 minute. +11. Aiden exited the playroom. +12. Avery likes the red_basket. +13. Abigail moved the lime to the green_envelope. +14. Abigail exited the playroom. +15. Emily, Jack, Avery, Aiden, and Abigail entered the waiting_room. + +From the story, we know that Jack moved the lime to the blue_suitcase and then exited the playroom. Avery made no movements and stayed in the playroom for 1 minute before exiting. Abigail moved the lime to the green_envelope before exiting. + +We also know that Avery likes the red_basket and Emily likes the green_crate. However, we don't have any information about what Jack thinks about the locations. + +To answer the question, we need to track the thoughts of the agents. Since Avery made no movements and stayed in the playroom for 1 minute, we can assume that Avery had time to think about the location of the lime. However, we don't know what Avery's actual thought is. + +Abigail moved the lime to the green_envelope, but we don't know what Abigail thinks about the location. Therefore, we cannot infer what Avery thinks Abigail thinks about the location of the lime. 
+ +Since we don't have any information about what Jack thinks about the locations, we cannot answer the question. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75f7657a681b9d214841c8062c755fd9516a0044 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Jack thinks Avery thinks Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Aiden exited the playroom after Abigail. +2. Abigail moved the lime to the green_envelope before exiting the playroom. +3. Avery made no movements and stayed in the playroom for 1 minute before exiting. +4. Jack moved the lime to the blue_suitcase before exiting the playroom. +5. Emily moved the lime to the blue_pantry before exiting the playroom. +6. Aiden made no movements and stayed in the playroom for 1 minute before exiting. + +Based on these steps, we can infer the following: + +- Aiden knows that Abigail moved the lime to the green_envelope before leaving the playroom. +- Aiden does not know what Avery, Jack, or Emily think about the location of the lime. +- Aiden knows that Avery stayed in the playroom for 1 minute before leaving, but does not know if Avery made any movements during that time. +- Aiden knows that Jack moved the lime to the blue_suitcase before leaving the playroom. +- Aiden knows that Emily moved the lime to the blue_pantry before leaving the playroom. + +Now let's apply the assumptions to the question: + +- Aiden can only infer what Jack thinks if they were in the same place or had private/public interactions. +- Aiden knows that Jack exited the playroom before him, so he may trust Jack's opinion more than Avery's or Emily's. +- Aiden knows that Abigail moved the lime to the green_envelope, but he does not know what she thinks about its location. 
+ +Based on this analysis, we can conclude that Aiden may think that Jack thinks the lime is in the blue_suitcase (since Jack moved it there before leaving the playroom). Aiden does not have any information about what Avery or Abigail think, so he cannot make any inferences about their opinions. Therefore, the answer is M. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b875e755c8ea92ae12e03641bedc8a7ebb58a8aa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with the watermelon. According to the story, the watermelon was initially in the blue_container in the back_yard. Ella moved the watermelon to the red_pantry before exiting the back_yard. Then, Amelia moved the watermelon back to the blue_container before exiting the back_yard. Therefore, the watermelon is really in the blue_container. The answer is L. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..23b76eb6b40503ee245a3ad10d60b309a8cbf6ba --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. 
+9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Avery really think the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with the watermelon. Avery entered the back_yard with the group, made no movements, and exited the back_yard before any interactions with the watermelon occurred. Therefore, Avery did not have any direct interaction with the watermelon and did not witness its movement. We cannot infer Avery's thoughts on the location of the watermelon based on the given information. The answer is not provided in the options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..38330f2ff203d8b76201255c31849c2159701a94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Owen think Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of Avery and the watermelon. Avery entered the back_yard and made no movements before exiting. Therefore, Avery did not move the watermelon. Ella moved the watermelon to the red_pantry after Avery exited. Owen entered the back_yard after Avery and made no movements before exiting. Therefore, Owen did not move the watermelon either. Amelia moved the watermelon to the blue_container after Ava exited. + +Since Owen did not move the watermelon and Avery did not move the watermelon, Owen would think that Avery thinks the watermelon is still in the blue_container where it was originally placed. Therefore, the answer is L. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..90f07261a719e0589756ab8ba06f0beb6abeef1f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. 
+12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Ella think Owen thinks Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Ella think Owen thinks Avery thinks the watermelon is? + +2. We know that the watermelon is in the blue_container (from statement 2). + +3. Avery made no movements and stayed in the back_yard for 1 minute (statement 3). + +4. Avery exited the back_yard (statement 4). + +5. Owen made no movements and stayed in the back_yard for 1 minute (statement 5). + +6. Owen exited the back_yard (statement 6). + +7. Ella moved the watermelon to the red_pantry (statement 7). + +8. Ella exited the back_yard (statement 8). + +9. Ava made no movements and stayed in the back_yard for 1 minute (statement 9). + +10. Ava exited the back_yard (statement 10). + +11. Amelia moved the watermelon to the blue_container (statement 11). + +12. 
Amelia exited the back_yard (statement 12). + +13. Avery, Owen, Ella, Ava and Amelia entered the waiting_room (statement 13). + +Based on these statements, we can infer that Ella knows the watermelon was originally in the blue_container, but she moved it to the red_pantry. Owen and Avery were both in the back_yard before Ella moved the watermelon, but we don't know where they think it is. + +Since Ella and Owen were both in the back_yard at some point, Ella can infer Owen's thoughts based on the assumptions. However, we don't have any information about what Owen thinks, so we can't answer the question. + +Therefore, the answer is: Insufficient information to answer the question. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fbb95d983843fdefd55bf9c54e2ff8976eb6a934 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Amelia think Ella thinks Owen thinks Avery thinks the watermelon is? 
+Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Amelia think the watermelon is? +According to step 11, Amelia moved the watermelon to the blue_container before exiting the back_yard. Therefore, Amelia thinks the watermelon is in the blue_container. + +2. Where does Amelia think Avery thinks the watermelon is? +Avery made no movements and stayed in the back_yard for 1 minute before exiting. Therefore, Avery did not see where the watermelon was moved to. Amelia moved the watermelon to the blue_container after Avery left the back_yard. Therefore, Amelia knows that Avery did not see where the watermelon was moved to. Since Avery made no movements, he did not interact with anyone else who might have seen where the watermelon was moved to. Therefore, Amelia thinks that Avery has no idea where the watermelon is. + +3. Where does Amelia think Owen thinks the watermelon is? +Owen made no movements and stayed in the back_yard for 1 minute before exiting. 
Therefore, Owen did not see where the watermelon was moved to. However, Owen was in the back_yard at the same time as Ella, who moved the watermelon to the red_pantry before exiting. Therefore, Owen might have seen where the watermelon was moved to. Since Owen made no movements, he did not interact with anyone else who might have seen where the watermelon was moved to. Therefore, Amelia thinks that Owen might know where the watermelon is, but she is not sure where he thinks it is. + +4. Where does Amelia think Ella thinks the watermelon is? +Ella moved the watermelon to the red_pantry before exiting the back_yard. Therefore, Ella knows that the watermelon is not in the blue_container. However, Ella did not see where Amelia moved the watermelon to after she left the back_yard. Therefore, Ella might think that the watermelon is still in the blue_container. Since Amelia knows that Avery has no idea where the watermelon is and Owen might know where it is, but she is not sure where he thinks it is, she cannot infer what Ella thinks about the location of the watermelon. Therefore, the answer is not provided in the options given. + +In conclusion, the answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef14200072b9f7030e45633e436902b8e9446712 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. 
+6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where is the carrot really? +Answer: red_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of the carrot and the agents. According to the story, the carrot was initially in the red_container (Step 2). Isabella moved the carrot to the blue_container (Step 3), and then Alexander moved the carrot to the green_bathtub (Step 11). Finally, Logan moved the carrot back to the red_container (Step 13). Therefore, the carrot is really in the red_container (Option B). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2c0ebc4d266a360d511671396fcefa643d29daa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does William really think the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the carrot and the agents. Isabella moved the carrot from the red_container to the blue_container. Then, Alexander moved the carrot from the blue_container to the green_bathtub. Finally, Logan moved the carrot from the green_bathtub back to the red_container. William made no movements in the cellar, but he exited after Evelyn and before Alexander. Therefore, he could have heard Evelyn's and Alexander's movements and claims about the carrot's location. Since Alexander moved the carrot to the green_bathtub and Logan moved it back to the red_container, it's possible that William thinks the carrot is still in the green_bathtub, but it's also possible that he thinks it's back in the red_container. However, since William exited the cellar after Evelyn and before Alexander, he may trust Alexander's claim more than Evelyn's. Therefore, the most likely answer is C. green_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..649f9a8581a3c2a55d677bc71419a525b3524fb1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. 
+5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Evelyn think William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of Isabella, Logan, Alexander, Evelyn, and William and the location of the carrot. We know that Isabella moved the carrot from the red_container to the blue_container, and Alexander moved the carrot from the blue_container to the green_bathtub, and Logan moved the carrot from the green_bathtub to the red_container. Evelyn made no movements, and William made no movements, so they did not move the carrot. 
Therefore, the carrot is in the red_container at the end of the story. + +Now we need to determine where Evelyn thinks William thinks the carrot is. Since Evelyn and William were both in the cellar, and Evelyn exited the cellar after William, she would tend to trust William's judgment more than her own. Since the carrot is in the red_container, we need to look for any clues that William may have thought the carrot was in the red_container. + +The story does not provide any direct information about William's thoughts on the location of the carrot. However, we know that Logan likes the green_bucket and the green_drawer, but he moved the carrot to the red_container. This suggests that the carrot was not in the green_bucket or the green_drawer, and William may have known this. Additionally, Isabella moved the carrot from the red_container to the blue_container, so William may have thought the carrot was originally in the red_container. + +Based on this reasoning, we can conclude that Evelyn thinks William thinks the carrot is in the red_container. Therefore, the answer is B. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f72af0c3e5a605254e7a5f47719556908b7ce2f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. 
+8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Logan think Evelyn thinks William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This question requires a lot of deduction based on the given assumptions and the story. We need to track the movements of each agent and their thoughts about the carrot's location. + +First, we know that Isabella moved the carrot from the red_container to the blue_container. Then, Alexander moved the carrot from the blue_container to the green_bathtub. Finally, Logan moved the carrot from the green_bathtub back to the red_container. + +We also know that Logan likes the green_drawer and the green_bucket, but we don't have any information about where he thinks the carrot is. 
+ +Evelyn made no movements and stayed in the cellar for 1 minute, so we don't know where she thinks the carrot is either. However, we do know that she exited the cellar before William, who also made no movements and stayed in the cellar for 1 minute. + +Since William exited the cellar after Evelyn, Logan would tend to trust Evelyn's thoughts more than William's. But we still don't know where Evelyn thinks the carrot is. + +Based on the given options, the only location that William could think the carrot is in is the blue_container, since that's where Isabella moved it from. + +So, where does Logan think Evelyn thinks William thinks the carrot is? We don't have any direct information about this, but we can make some educated guesses. + +Logan knows that William made no movements in the cellar and stayed there for 1 minute, so he might assume that William didn't see where Isabella moved the carrot to. Therefore, Logan might think that Evelyn doesn't know where the carrot is either, since she exited the cellar before William and didn't make any movements. + +However, Logan also knows that Alexander moved the carrot to the green_bathtub, so he might think that Evelyn saw this happen and therefore knows that the carrot is in the green_bathtub. + +Therefore, the answer could be either C. green_bathtub or unknown, since we don't have enough information to say for sure what Logan thinks Evelyn thinks William thinks the carrot is. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e99218fd7023402ffc50f070d1c39f11a7dced21 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Alexander think Logan thinks Evelyn thinks William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis. We need to determine where Alexander thinks Logan thinks Evelyn thinks William thinks the carrot is. To do this, we need to track the movements of each character and their interactions with each other. 
+ +1. Isabella, Evelyn, William, Alexander, and Logan entered the cellar. +2. The carrot is in the red_container. +3. Isabella moved the carrot to the blue_container. +4. Logan likes the green_drawer. +5. Isabella exited the cellar. +6. Evelyn made no movements and stayed in the cellar for 1 minute. +7. Logan likes the green_bucket. +8. Evelyn exited the cellar. +9. William made no movements and stayed in the cellar for 1 minute. +10. William exited the cellar. +11. Alexander moved the carrot to the green_bathtub. +12. Alexander exited the cellar. +13. Logan moved the carrot to the red_container. +14. Logan exited the cellar. +15. Isabella, Evelyn, William, Alexander, and Logan entered the waiting_room. + +Based on the assumption that agents tend to lie, we cannot trust what they say about their thoughts. Instead, we need to infer their thoughts based on their actions and interactions. + +We know that the carrot was originally in the red_container, but Isabella moved it to the blue_container. Logan then moved it back to the red_container. We also know that Logan likes the green_drawer and the green_bucket, but we don't know if he actually saw the carrot in either of those places. + +Evelyn and William made no movements in the cellar, so we don't have any information about their thoughts on the carrot's location. Alexander moved the carrot to the green_bathtub, but we don't know if he saw Logan or any of the other agents in the cellar. + +Based on the assumption that agents tend to trust those who exit the room later than themselves, Alexander may trust Logan's judgment on the carrot's location. However, we don't have any information about Evelyn or William's thoughts on the carrot's location, so we cannot use them to determine Alexander's thoughts. + +Therefore, the answer to the question is: we cannot determine where Alexander thinks Logan thinks Evelyn thinks William thinks the carrot is. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6b8e7f79e787a98078273866e562fcbf285c6fc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to look at step 2 and step 10 of the story. Step 2 states that the lettuce is in the blue_crate, and step 10 states that Alexander moved the lettuce to the blue_container. Therefore, the correct answer is I. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ec6501d4806418e97e571dc15bdec0dbb07b2e4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Liam really think the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. 
red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to look at the movements and actions of Liam and Alexander. Liam entered the patio with Mila, Emma, Alexander, and Avery. He made no movements and stayed in the patio for 1 minute before exiting. Alexander moved the lettuce to the blue_container before exiting the patio. + +Based on the assumption that an agent tends to trust an agent that exited the room later than himself, we can assume that Liam trusts Alexander's actions. Therefore, Liam really thinks that the lettuce is in the blue_container. + +The answer is I. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c04d0b53916d43cacb39c3be89c8d99f5b8fa3b9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. 
+5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Emma think Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of Emma and Liam and the location of the lettuce. Emma and Liam both entered the patio and stayed there for a minute before exiting. Mila, Alexander, and Avery also entered the patio, and Alexander moved the lettuce to the blue_container before exiting. Then all five agents entered the waiting_room. + +Based on the assumptions, we know that Emma can only infer Liam's thoughts if they were in the same place or had private or public interactions. 
We also know that agents tend to lie, so we cannot trust what they say. + +There is no information in the story that suggests Liam had any private or public interactions with Emma or that they were in the same place after leaving the patio. Therefore, Emma cannot infer Liam's thoughts about the location of the lettuce. + +The answer is none of the above (N/A). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dfdb2b3ae22eb73ce2bb59b6d8f224d54425d79e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Mila think Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements and actions of Mila, Liam, Emma, and Alexander in relation to the lettuce. We know that Mila did not move or interact with the lettuce, but Alexander moved it to the blue_container. Liam also did not move or interact with the lettuce. Emma also did not move or interact with the lettuce. + +Based on the given assumptions, Mila can only infer what Emma thinks about the lettuce if they were in the same place or had private or public interactions. We know that Mila and Emma were both in the patio, but we do not have any information about their interactions. + +However, we do know that Alexander moved the lettuce to the blue_container before exiting the patio. Mila would trust Alexander's actions since he exited the patio after Mila did. Therefore, Mila would likely think that the lettuce is in the blue_container. + +Since we are asked where Mila thinks Emma thinks Liam thinks the lettuce is, we need to consider Liam's actions as well. Liam did not move or interact with the lettuce, so Mila would not have any reason to think that Liam has a specific idea about where the lettuce is. + +Therefore, Mila would likely think that Emma thinks the lettuce is in the blue_container, based on Alexander's actions. + +The answer is I. blue_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8062083f9faca62898e1e4fd2581492d3455ac59 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Avery think Mila thinks Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to track the movements and actions of Mila, Liam, Emma, Alexander, and Avery. Mila, Liam, Emma, Alexander, and Avery entered the patio together. Mila made no movements and stayed in the patio for 1 minute before exiting. Liam made no movements and stayed in the patio for 1 minute before exiting. Emma made no movements and stayed in the patio for 1 minute before exiting. Alexander moved the lettuce to the blue_container before exiting. Avery made no movements and stayed in the patio for 1 minute before exiting and seeing a mouse. Then, Mila, Liam, Emma, Alexander, and Avery entered the waiting_room together. + +We don't have any information about Mila's thoughts on the lettuce, but we know that Avery saw the mouse in the patio. Therefore, Avery knows that the lettuce is not in the blue_container because Alexander moved it there before exiting. We also know that Avery did not see Mila, Liam, or Emma make any movements in the patio, so Avery does not have any information about their thoughts on the lettuce. + +Therefore, we cannot determine where Avery thinks Mila thinks Emma thinks Liam thinks the lettuce is. The answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..529829157bb65384ddc786debb6222971ef553a3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where is the corn really? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their statements. According to the story, Jackson, Charlotte, Avery, Liam, and Benjamin entered the cellar. The corn was initially in the blue_treasure_chest. 
Jackson made no movements and stayed in the cellar for 1 minute before exiting. Charlotte moved the corn to the green_crate and then exited the cellar. Avery made no movements and stayed in the cellar for 1 minute before exiting. Liam made no movements and stayed in the cellar for 1 minute before exiting. Benjamin made no movements and stayed in the cellar for 1 minute before exiting. Finally, all five agents entered the waiting_room. + +We can eliminate options C, F, J, M, and N as they were not mentioned in the story. We can also eliminate options D, H, and L as there was no mention of any agent interacting with or mentioning them. Option E can be eliminated as Avery made no mention of the blue_bathtub. Option G can be eliminated as there was no mention of any drawer. Option I can be eliminated as there was no mention of any red_crate. Option K can be eliminated as there was no mention of any treasure chest other than the blue_treasure_chest. + +Therefore, the only option left is B, green_crate, as Charlotte moved the corn to the green_crate before exiting the cellar. So, the corn is really in the green_crate. The answer is B. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..511db80102bd4ee49689a7145640a75f9954bb92 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. 
+7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Benjamin really think the corn is? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to look at the movements and actions of each character in the story. We know that the corn was initially in the blue_treasure_chest, but Charlotte moved it to the green_crate. Jackson, Avery, Liam, and Benjamin all entered the cellar, but only Jackson and Avery stayed for one minute without making any movements. All four characters then exited the cellar and later entered the waiting_room. 
+ +Based on the assumptions given, we know that Benjamin can only infer the thoughts of other characters if he has been in the same place as them or has had private or public interactions with them. We also know that each character tends to lie, so we cannot trust what they say to others. + +Since Benjamin did not make any movements in the cellar and did not have any private or public interactions with Charlotte or Avery, he cannot be sure where the corn is. However, he may trust Avery's claim that he likes the blue_bathtub, which could lead him to believe that the corn is in the blue_container. Therefore, the answer is O. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba8629df24ebf752008882060546850223449d24 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Jackson think Benjamin thinks the corn is? 
+Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with each other. We know that Jackson entered the cellar with the others, made no movements, and exited after 1 minute. Charlotte moved the corn to the green crate and then exited. Avery made no movements and exited after 1 minute. Liam and Benjamin also made no movements and exited after 1 minute. Finally, all five agents entered the waiting room. + +Since Jackson exited before Benjamin, he would tend to trust Benjamin's thoughts about the location of the corn. However, we don't have any information about Benjamin's thoughts or interactions with Jackson. We only know that he made no movements in the cellar and exited after 1 minute. + +Therefore, we cannot determine where Jackson thinks Benjamin thinks the corn is located based on the given information. The answer is unknown. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7cdff2424065b632c8c4e4f824d1910945bba375 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Liam think Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements and thoughts of each agent. + +1. Jackson, Charlotte, Avery, Liam, and Benjamin entered the cellar. +2. The corn is in the blue_treasure_chest. +3. Jackson made no movements and stayed in the cellar for 1 minute. +4. Jackson exited the cellar. +5. Charlotte moved the corn to the green_crate. +6. Charlotte exited the cellar. +7. Avery likes the blue_bathtub. +8. Avery made no movements and stayed in the cellar for 1 minute. +9. Avery exited the cellar. +10. Liam made no movements and stayed in the cellar for 1 minute. +11. Liam exited the cellar. +12. Benjamin made no movements and stayed in the cellar for 1 minute. +13. Benjamin exited the cellar. +14. Jackson, Charlotte, Avery, Liam, and Benjamin entered the waiting_room. + +Based on the movements, we know that Liam was the last one to exit the cellar. Therefore, he would trust the thoughts of Benjamin the most, followed by Jackson, Charlotte, and Avery. + +We don't have any information about where Benjamin thinks the corn is, so we can't use that to answer the question. + +We know that Jackson was in the cellar before the corn was moved, but we don't know if he saw where it was moved to. Therefore, we can't use Jackson's thoughts to answer the question. + +We know that Charlotte moved the corn to the green_crate, but we don't know if she shared this information with anyone. Therefore, we can't use Charlotte's thoughts to answer the question. + +We know that Avery likes the blue_bathtub, but this information is irrelevant to the location of the corn. Therefore, we can't use Avery's thoughts to answer the question. 
+ +Since Liam was the last one to exit the cellar, he would trust the thoughts of Benjamin the most. However, we don't have any information about where Benjamin thinks the corn is. Therefore, we can't use this information to answer the question. + +Therefore, we don't have enough information to answer the question. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..917e19fd480b7efefb1eae94d0ae9918a3485d06 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Charlotte think Liam thinks Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This question requires a lot of inference and deduction based on the given assumptions and story. Let's break it down step by step: + +1. Charlotte moved the corn to the green_crate, so we know that she thinks the corn is in the green_crate. +2. Liam made no movements and stayed in the cellar for 1 minute, so we don't know where he thinks the corn is. +3. Jackson made no movements and stayed in the cellar for 1 minute, so we don't know where he thinks the corn is. +4. Benjamin made no movements and stayed in the cellar for 1 minute, so we don't know where he thinks the corn is. +5. Charlotte exited the cellar before Avery and Liam, so she trusts herself more than them. +6. Avery likes the blue_bathtub, but we don't know where he thinks the corn is. + +Based on these steps, we can make some assumptions about what Charlotte thinks Liam thinks Jackson thinks Benjamin thinks: + +1. Charlotte thinks the corn is in the green_crate. +2. Charlotte trusts herself more than Liam and Jackson, so she thinks Liam and Jackson might have different thoughts about where the corn is. +3. Charlotte doesn't know where Benjamin thinks the corn is, so she might assume he thinks it's in the green_crate like her, or he might have a different thought. 
+ +Therefore, Charlotte might think Liam thinks Jackson thinks Benjamin thinks the corn is in the green_crate. So the answer is B. green_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cc3624435e3496048c765e0461487cbc51b79a5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where is the asparagus really? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To solve this question, we need to look for any clues in the story that can help us determine the location of the asparagus. The only clue we have is from sentence 2, which states that "the asparagus is in the green_bottle." Therefore, the correct answer is L. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cfa816c440163c5d026249cd6726f7a72559a9d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Emily really think the asparagus is? 
+Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to look for any clues in the story that suggest where Emily thinks the asparagus is. However, there is no mention of Emily's thoughts or actions related to the asparagus. Therefore, we cannot determine where Emily thinks the asparagus is based on the given information. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..494b63d1d0845cb0a365e4f2bbcb84fc91c6a945 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. 
+4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Hannah think Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of Emily and Hannah and their possible interactions. Emily entered the staircase first and made no movements before exiting. Hannah entered the staircase last and made no movements before exiting. Therefore, Hannah did not have any interaction with Emily in the staircase. However, both Emily and Hannah entered the waiting room together. 
Since we do not have any information about their private or public interactions in the waiting room, we cannot infer what Hannah thinks about Emily's thoughts on the location of the asparagus. Therefore, the answer is not provided in the given information. The correct answer is: Not enough information provided. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..19be2bb5a01561cfe1ecc51eed34bf69bc5915e2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Amelia think Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: The question is asking about Amelia's thoughts on Hannah's thoughts on Emily's thoughts about the location of the asparagus. To answer this question, we need to track the movements of each person and their possible interactions. + +1. Emily, Abigail, Amelia, Elizabeth, and Hannah entered the staircase together. +2. The asparagus is in the green bottle. +3. Emily made no movements and stayed in the staircase for 1 minute. +4. Emily exited the staircase. +5. Abigail made no movements and stayed in the staircase for 1 minute. +6. Abigail exited the staircase. +7. Amelia made no movements and stayed in the staircase for 1 minute. +8. Amelia exited the staircase. +9. Elizabeth made no movements and stayed in the staircase for 1 minute. +10. Elizabeth exited the staircase. +11. Hannah made no movements and stayed in the staircase for 1 minute. +12. Hannah exited the staircase. +13. Emily, Abigail, Amelia, Elizabeth, and Hannah entered the waiting room. + +Based on the assumptions, we know that Amelia can only infer Hannah's thoughts if they had private or public interactions. However, there is no mention of any interactions between Amelia and Hannah. Therefore, we cannot determine where Amelia thinks Hannah thinks Emily thinks the asparagus is. + +The answer is: Cannot be determined. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..039d6b94e6cc79bc5f815f78cd464a73e577d386 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? + +2. We know that Emily, Abigail, Amelia, Elizabeth, and Hannah entered the staircase together. + +3. Emily made no movements and stayed in the staircase for 1 minute before exiting. + +4. Abigail made no movements and stayed in the staircase for 1 minute before exiting. + +5. Amelia made no movements and stayed in the staircase for 1 minute before exiting. + +6. Elizabeth made no movements and stayed in the staircase for 1 minute before exiting. + +7. Hannah made no movements and stayed in the staircase for 1 minute before exiting. + +8. Emily, Abigail, Amelia, Elizabeth, and Hannah then entered the waiting room. + +9. We also know that the asparagus is in the green bottle. + +Based on these facts, we can make some assumptions about what Abigail thinks Amelia thinks Hannah thinks Emily thinks about the asparagus: + +1. Abigail and Amelia were in the same place (the staircase) at the same time, so Abigail can infer Amelia's thoughts. + +2. Hannah and Emily were also in the same place (the staircase) at the same time, so Amelia can infer their thoughts. + +3. However, Abigail cannot directly infer what Emily thinks about the asparagus, since Emily made no movements and stayed in the staircase for 1 minute before exiting. + +4. Abigail can only infer what Hannah thinks about the asparagus based on what Amelia thinks, since Hannah and Amelia were in the same place (the staircase) at the same time. + +5. 
We know that the asparagus is in the green bottle, so Emily, Hannah, and Amelia all know this fact. + +Based on these assumptions, we can conclude that Abigail thinks Amelia thinks Hannah thinks Emily thinks the asparagus is in the green bottle. Therefore, the answer is L. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a48537756590420e87cdb1122ed9d5db6fbd81a8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their trust level towards each other. + +1. Isabella moved the tomato to the green_box. +2. Carter made no movements and stayed in the bedroom for 1 minute. +3. Elizabeth moved the tomato to the blue_container. +4. Hannah made no movements and stayed in the bedroom for 1 minute. +5. Jacob made no movements and stayed in the bedroom for 1 minute. + +Based on the given information, the tomato was last seen in the blue_container, which was moved by Elizabeth. However, we also need to consider the trust level of the agents towards each other. + +Isabella moved the tomato to the green_box, but we don't know if she saw where the tomato originally was. Carter made no movements, so he doesn't have any information about the tomato's location. Hannah and Jacob also made no movements, so they don't have any information either. + +Therefore, the only agent who moved the tomato and has information about its location is Elizabeth. Based on the assumption that agents tend to trust those who exited the room later than themselves, we can assume that Isabella, Carter, Hannah, and Jacob would trust Elizabeth's claim about the tomato's location. + +Therefore, the answer is E. blue_container. 
+ +a: 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b0ff043104175355054dba142b997f9fbb4a6f9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Jacob really think the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the tomato and the agents. Isabella moved the tomato from the green_bottle to the green_box, then Elizabeth moved it from the green_box to the blue_container. We know that Carter made no movements, Hannah made no movements, and Jacob lost his watch. Therefore, Jacob did not move the tomato. + +Based on the given information, Jacob was in the bedroom when Isabella moved the tomato to the green_box and he was still in the bedroom when Elizabeth moved it to the blue_container. We do not have any information that suggests Jacob had a private or public interaction with any other agent about the location of the tomato. + +Therefore, we can assume that Jacob thinks the tomato is still in the green_box, as that was the last place he saw it before leaving the bedroom. + +The answer is D. green_box. + +a: 9 3 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88bcf9f491102b57a12a5ddad339e03fb5e0b1f9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. 
+7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Hannah think Jacob thinks the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with the tomato. Isabella moved the tomato from the green_bottle to the green_box, and Elizabeth moved it from the green_box to the blue_container. Hannah and Jacob made no movements with the tomato. + +Since Hannah and Jacob were both in the bedroom at the same time, Hannah can infer Jacob's thoughts about the tomato based on his movements and any private or public interactions they had. 
However, we have no information about any private or public interactions between Hannah and Jacob, so we can only rely on Jacob's movements. + +Jacob made no movements with the tomato, so we need to determine where the tomato was when he entered and exited the bedroom. The tomato was in the green_box when Isabella exited the bedroom, and Elizabeth moved it to the blue_container before she exited. Therefore, the tomato was in the blue_container when Jacob exited the bedroom. + +Based on this information, we can eliminate all answer choices except for E. blue_container. We know that the tomato was in the blue_container when Jacob exited the bedroom, so Hannah would think that Jacob thinks the tomato is in the blue_container. + +Therefore, the answer is E. blue_container. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ac71f63b587c8b3f77eede62b881af05557e05a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. 
+14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Isabella think Hannah thinks Jacob thinks the tomato is? +Answer: green_box +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_box +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their possible interactions. Isabella moved the tomato from the green_bottle to the green_box before exiting the bedroom. Elizabeth then moved the tomato from the green_box to the blue_container before exiting the bedroom. Hannah and Jacob made no movements with the tomato before exiting the bedroom. + +Since Isabella and Hannah were both in the bedroom at the same time, Isabella could have inferred Hannah's thoughts about the tomato's location. However, we don't know if they had any private or public interactions that would reveal this information. + +Jacob lost his watch in the bedroom, but this doesn't give us any information about the tomato's location. 
+ +When Isabella, Carter, Elizabeth, Hannah, and Jacob entered the waiting room, we don't know if they had any conversations that would reveal their thoughts about the tomato's location. + +Based on the given information, we know that Isabella moved the tomato from the green_bottle to the green_box, but we don't know where Hannah or Jacob think the tomato is. Therefore, we cannot determine where Isabella thinks Hannah thinks Jacob thinks the tomato is. + +The answer is not provided in the options given. + +a: 6 4 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67db708bec402d0faf688a92559c54965bce36b5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Elizabeth think Isabella thinks Hannah thinks Jacob thinks the tomato is? +Answer: green_box +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. 
green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_box +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Elizabeth moved the tomato to the blue_container, so she knows where the tomato is. +2. Isabella moved the tomato to the green_box before leaving the bedroom, so she thinks the tomato is in the green_box. +3. Hannah made no movements in the bedroom, so she doesn't know where the tomato is. +4. Jacob lost his watch and made no movements in the bedroom, so he doesn't know where the tomato is. +5. We don't know what Carter thinks about the tomato's location, as he made no movements in the bedroom. + +Based on these observations, we can start to infer what Elizabeth thinks Isabella thinks Hannah thinks Jacob thinks the tomato is. Here are the possibilities: + +- If Elizabeth thinks Isabella knows where the tomato is (i.e. in the green_box), she might assume that Isabella thinks Hannah and Jacob also know where it is. Therefore, she might think that Isabella thinks Hannah and Jacob think the tomato is in the green_box. +- If Elizabeth thinks Isabella doesn't know where the tomato is (i.e. 
she left before Isabella moved it to the green_box), she might assume that Isabella thinks Hannah and Jacob also don't know where it is. Therefore, she might think that Isabella thinks Hannah and Jacob have no idea where the tomato is. + +We don't have enough information to determine which of these possibilities is correct. However, we do know that Elizabeth moved the tomato to the blue_container, so she might be biased towards thinking that the tomato is in the blue_container. Therefore, the most likely answer is E. blue_container. + +a: 6 2 4 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6ac74672b2b8f8f8becb8daa8de8f3c85c75693 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. 
green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the watermelon. Mila moved the watermelon from the blue cupboard to the red box, and Ava moved it from the red box to the green bottle. Emily then moved it from the green bottle to the blue bathtub. Therefore, the watermelon is in the blue bathtub. The answer is A. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba418efa0db1b5782c15660b2bb2bf3d534e3af9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. 
+9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Ava really think the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the watermelon and the agents. Mila moved the watermelon to the red_box, then Ava moved it to the green_bottle, and finally, Emily moved it to the blue_bathtub. Evelyn and Jacob made no movements and stayed in the front_yard for 1 minute before exiting. Mila, Ava, Emily, Evelyn, and Jacob then entered the waiting_room. + +Based on the assumptions given, we know that Ava can only infer the location of the watermelon based on her own observations and any private or public interactions she had with the other agents. We also know that agents tend to lie, so we cannot trust any public claims made by the agents. + +Therefore, the answer to the question is E. 
red_box, as that was the last known location of the watermelon before Ava moved it. We cannot trust Ava's claim that she moved it to the green_bottle, as she could be lying. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..14ce7f969373823d42372ee067d416925b9e7f75 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Jacob think Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their exit order. Mila moved the watermelon to the red_box and then exited the front_yard. Ava moved the watermelon to the green_bottle and then exited the front_yard. Emily moved the watermelon to the blue_bathtub and then exited the front_yard. Evelyn and Jacob made no movements and stayed in the front_yard for 1 minute before exiting. Therefore, Jacob exited the front_yard after Ava and can trust her more than Mila or Emily. + +Based on this information, we can conclude that Jacob thinks Ava thinks the watermelon is in the green_bottle, as that was the last place Ava moved it before exiting the front_yard. Therefore, the answer is D. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..14077dcaadf646935733f989432dd8cab80d1dac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. 
+8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Emily think Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions with each other. Mila moved the watermelon to the red_box, and Ava moved it to the green_bottle. Emily then moved it to the blue_bathtub. Evelyn and Jacob made no movements and stayed in the front_yard for 1 minute before exiting. Mila, Ava, Emily, Evelyn, and Jacob then entered the waiting_room. + +Since Jacob made no movements and stayed in the front_yard for 1 minute, he did not interact with the watermelon or any of the other agents after Mila moved it to the red_box. Therefore, he has no idea where the watermelon is. 
+ +Emily, on the other hand, moved the watermelon to the blue_bathtub after Ava moved it to the green_bottle. Therefore, Emily knows that Ava did not leave the watermelon in the green_bottle. However, since Jacob did not interact with the watermelon, Emily has no idea where he thinks it is. + +Therefore, the answer is none of the above. Emily does not know where Jacob thinks Ava thinks the watermelon is. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..53eaa1357e11664ef95ae6ab5f2f70e49f9d3d20 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. 
green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? + +2. We know that Mila moved the watermelon to the red_box, Ava moved it to the green_bottle, and Emily moved it to the blue_bathtub. + +3. We also know that Evelyn made no movements and stayed in the front_yard for 1 minute, and Jacob made no movements and stayed in the front_yard for 1 minute. + +4. Mila, Ava, Emily, Evelyn, and Jacob all entered the waiting_room together. + +5. Based on the assumptions given, we know that Evelyn can only infer Jacob's thoughts if they were in the same place or had private or public interactions. + +6. We also know that agents tend to lie, so what they tell others doesn't necessarily reflect their actual thoughts. + +7. Finally, we know that agents tend to trust those who exited the room later than themselves. + +Based on this information, we can eliminate some of the answer choices. We know that the watermelon was not in the blue_cupboard, red_drawer, red_bucket, blue_suitcase, green_treasure_chest, blue_drawer, green_basket, red_envelope, green_envelope, or green_pantry, as these locations were not mentioned in the story. 
+ +We also know that Mila moved the watermelon to the red_box, so it cannot be in the blue_cupboard or green_bottle. + +Therefore, the only possible answer is A. blue_bathtub. Evelyn may think that Emily thinks Jacob thinks Ava thinks the watermelon is in the blue_bathtub, based on the fact that Emily moved it there and Jacob and Ava did not move it again before leaving the front_yard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb7005e0448172af2a1fea6b38cf6ad9ef856e77 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to track the movements of the eggplant and determine its final location. According to the story, Liam, Jack, Hannah, Owen, and Noah entered the pantry and made movements with the eggplant before exiting. Liam made no movements, so we can ignore him. Noah lost his gloves and moved the eggplant to the green_envelope before exiting. Jack moved the eggplant to the green_bathtub before exiting. Hannah moved the eggplant to the blue_cupboard before exiting. Owen moved the eggplant to the green_basket before exiting. Therefore, the eggplant's final location is the green_basket. The answer is J. green_basket. + +a: 3 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f44192ee8058661c45c7d3fb3ffaf2d93bfce51a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. 
+6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Noah really think the eggplant is? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to track the movements of the eggplant and the agents. We know that Liam did not move the eggplant and Noah lost his gloves. Jack moved the eggplant to the green bathtub, Hannah moved it to the blue cupboard, Owen moved it to the green basket, and finally, Noah moved it to the green envelope. We also know that Liam, Jack, Hannah, Owen, and Noah all entered the pantry and then later entered the waiting room. 
+ +Based on the assumptions given, we know that Noah can only infer the location of the eggplant based on his own observations and any private or public interactions he had with the other agents. We also know that agents tend to lie, so we cannot trust what they say to each other. + +Therefore, we can only determine where Noah thinks the eggplant is based on his own movements and observations. Since we know that Noah lost his gloves and did not move the eggplant, we can assume that he was preoccupied with finding his gloves and may not have been paying close attention to the movements of the eggplant. + +However, we do know that Noah exited the pantry after Owen, who moved the eggplant to the green basket. Therefore, it is possible that Noah may think the eggplant is still in the green basket. + +Based on this reasoning, the answer would be J. green_basket. + +a: 7 6 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..afc39225562ef2e9347788df99cc642e950d2115 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. 
+14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Hannah think Noah thinks the eggplant is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of the eggplant and the agents. Liam did not move the eggplant and left the pantry first. Noah lost his gloves and moved the eggplant to the green envelope before leaving the pantry. Jack moved the eggplant to the green bathtub and then left the pantry. Hannah moved the eggplant to the blue cupboard and then left the pantry. Finally, Owen moved the eggplant to the green basket and then left the pantry. + +Since Hannah and Noah were never in the pantry at the same time, Hannah cannot infer Noah's thoughts directly. However, Hannah knows that Owen moved the eggplant to the green basket after she moved it to the blue cupboard. Therefore, Hannah may think that Noah believes the eggplant is still in the green envelope, as he left the pantry before Owen moved the eggplant to the green basket. + +Therefore, the answer is F. green_envelope. 
+ +a: 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e5a3b21b40f596b23ed3ddae71cb2ef5a5718feb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Jack think Hannah thinks Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_bathtub +GPT-4 Explain: To solve this question, we need to track the movements of the eggplant and the agents' exits from the pantry. According to the story, Jack moved the eggplant to the green_bathtub, then exited the pantry. Hannah moved the eggplant to the blue_cupboard, then exited the pantry. Noah moved the eggplant to the green_envelope, then exited the pantry. Liam made no movements and exited the pantry after Noah. + +Since Jack exited the pantry before Hannah and Noah, he trusts their movements more than his own. Therefore, he believes that Hannah thinks the eggplant is in the location where Noah left it, which is the green_envelope. Therefore, the answer is F. green_envelope. + +a: 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae0a155bb71c8983cd1afe658cdd79cd6a4bd575 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. 
+14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Owen think Jack thinks Hannah thinks Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims.Correct answer: green_bathtub +GPT-4 Explain: To solve this question, we need to work backwards from Owen to Noah, then to Hannah, then to Jack, and finally to the location of the eggplant. + +According to the story, Owen moved the eggplant to the green_basket before exiting the pantry. Therefore, Owen thinks the eggplant is in the green_basket. + +Noah lost his gloves and exited the pantry before Owen. Therefore, Owen trusts Noah's claim that the eggplant is in the green_envelope. + +Hannah moved the eggplant to the blue_cupboard before exiting the pantry. Therefore, Noah thinks Hannah thinks the eggplant is in the blue_cupboard. + +Jack moved the eggplant to the green_bathtub before exiting the pantry. Therefore, Hannah thinks Jack thinks the eggplant is in the green_bathtub. + +Therefore, Owen thinks Jack thinks Hannah thinks Noah thinks the eggplant is in the green_envelope (option F). 
+ +a: 6 7 5 4 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3381ba30aab076b70ac7c3e451b901835cc071fc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where is the spinach really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to look for the sentence that tells us where the spinach is located. According to sentence 3, the spinach is in the green_bucket. Therefore, the answer is K. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a30db47a69f68ce4bc33a40d0694f88d863a1a37 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Noah really think the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. 
green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: The question is asking where Noah really thinks the spinach is. To answer this question, we need to look at the story and the assumptions given. According to the story, the spinach is in the green_bucket (line 3). Noah entered the front_yard (line 2), made no movements and stayed in the front_yard for 1 minute (line 4), and then exited the front_yard (line 5). We do not have any information that suggests Noah had any private or public interactions with anyone else during this time. Therefore, based on the assumption that an agent can only infer another agent's thought if they have been in the same place or have private or public interactions, we can assume that Noah thinks the spinach is in the green_bucket. + +The correct answer is K. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7de43e94806004d0481c1fb8f9bfcd44c816b470 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Mila think Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of Mila and Noah and their interactions with each other. Mila moved the spinach to the green_bucket in the front yard before exiting. 
Noah entered the front yard, made no movements, and then exited. Mila and Noah did not have any private or public interactions. Therefore, Mila cannot infer Noah's thought about the location of the spinach. Mila's own thought about the location of the spinach is that it is in the green_bucket. So, the answer is K. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cdd30eeb5b8d8a550c355626830fb43379666d5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Emily think Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Emily think Mila thinks Noah thinks the spinach is? + +2. We know that Mila moved the spinach to the green_bucket (step 13). + +3. We also know that Noah made no movements and stayed in the front_yard for 1 minute (step 4). + +4. Therefore, Noah did not see where Mila put the spinach. + +5. Emily was in the front_yard with Noah, Mila, Avery, and Evelyn (step 2). + +6. Emily made no movements and stayed in the front_yard for 1 minute (step 6). + +7. Therefore, Emily did not see where Mila put the spinach either. + +8. Avery and Evelyn were also in the front_yard with Noah, Mila, and Emily (step 2). + +9. However, we do not know if Avery or Evelyn saw where Mila put the spinach. + +10. We do know that Avery saw a cat (step 12), but this does not give us any information about the spinach. + +11. Therefore, we cannot use Avery's actions to determine where Mila thinks Noah thinks the spinach is. + +12. We also know that Evelyn saw a dog (step 1), but this does not give us any information about the spinach either. + +13. Therefore, we cannot use Evelyn's actions to determine where Mila thinks Noah thinks the spinach is. + +14. The only information we have is that Mila moved the spinach to the green_bucket (step 13). + +15. 
Therefore, Emily would think that Mila thinks Noah thinks the spinach is in the green_bucket (option K). + +Answer: K. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..caca8c320f868f739b22b25248ebb0854e66423b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1,80 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? + +2. To answer this question, we need to trace the movements of each character and their interactions with each other. + +3. Evelyn saw a dog, but this is not relevant to the question. + +4. Noah, Emily, Avery, Evelyn, and Mila entered the front yard together. + +5. The spinach is in the green bucket, but we need to know who knows this information. + +6. Noah made no movements and stayed in the front yard for 1 minute, but we don't know what he was thinking. + +7. Emily made no movements and stayed in the front yard for 1 minute, but we don't know what she was thinking. + +8. Avery made no movements and stayed in the front yard for 1 minute, but we don't know what she was thinking. + +9. Evelyn made no movements and stayed in the front yard for 1 minute, but we don't know what she was thinking. + +10. Evelyn exited the front yard, but we don't know where she went. + +11. Avery saw a cat, but this is not relevant to the question. + +12. Mila moved the spinach to the green bucket, but we need to know who knows this information. + +13. Mila exited the front yard, but we don't know where she went. + +14. Noah, Emily, Avery, Evelyn, and Mila entered the waiting room together. + +15. 
Based on the assumptions given, we know that Evelyn can only infer what Emily thinks if they were in the same place or had private or public interactions. + +16. We also know that agents tend to lie, so what they tell others doesn't necessarily reflect their actual thoughts. + +17. We know that agents tend to trust agents who exited the room later than themselves, and the exit order is known to all agents. + +18. We know that agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. + +19. Based on this information, we can make some educated guesses about what Evelyn thinks Emily thinks Mila thinks Noah thinks about the spinach. + +20. Since Mila moved the spinach to the green bucket, she knows where it is. + +21. If Mila had a private conversation with Noah, she could have told him where the spinach is. + +22. If Noah and Emily had a private conversation, Noah could have told Emily where the spinach is. + +23. If Emily and Mila had a private conversation, Mila could have told Emily where the spinach is. + +24. If Emily and Evelyn had a private conversation, Emily could have told Evelyn where she thinks the spinach is. + +25. Based on the assumptions given, Evelyn can only infer what Emily thinks if they were in the same place or had private or public interactions. + +26. Since Emily and Evelyn were both in the front yard together, it's possible that they had a private or public conversation about the spinach. + +27. However, we don't have enough information to determine where Evelyn thinks Emily thinks Mila thinks Noah thinks the spinach is. + +28. Therefore, the answer to the question is unknown. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1be270bb8206df9557fe7bdb7a84ac61c6dbf29e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where is the potato really? +Answer: red_bottle +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their interactions with the potato and the containers. + +1. Logan, Charlotte, Hannah, Benjamin, and Evelyn entered the patio together. +2. The potato is in the green_envelope. +3. Charlotte likes the red_bottle. +4. Logan made no movements and stayed in the patio for 1 minute. +5. Logan exited the patio. +6. Charlotte moved the potato to the red_bottle. +7. Charlotte exited the patio. +8. Hannah made no movements and stayed in the patio for 1 minute. +9. Hannah exited the patio. +10. Benjamin made no movements and stayed in the patio for 1 minute. +11. Benjamin exited the patio. +12. Evelyn made no movements and stayed in the patio for 1 minute. +13. Evelyn exited the patio. +14. Logan, Charlotte, Hannah, Benjamin, and Evelyn entered the waiting_room. + +Based on the story and assumptions, we can eliminate some options. We know that the potato was initially in the green_envelope and Charlotte moved it to the red_bottle. We also know that Charlotte likes the red_bottle. Therefore, the potato must be in the red_bottle. + +The answer is N. red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a47c480f23d82af0478338e388f84c2d36f8c377 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Logan really think the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to look for clues in the story that tell us where the potato actually is and what Logan's thoughts might be. We know that the potato was initially in the green_envelope, but Charlotte moved it to the red_bottle. 
Logan made no movements and stayed in the patio for 1 minute before exiting. We also know that Logan tends to lie and that he may trust agents who exited the room later than himself. + +Based on this information, we can eliminate options A, C, E, H, I, K, L, M, O as they do not involve the red_bottle where Charlotte moved the potato. We can also eliminate options D, F, and N as there is no indication in the story that the potato is in a blue container. + +This leaves us with options B and J. Logan made no movements while in the patio, so he did not move the potato to the red_container himself. However, he may have seen Charlotte move the potato and know that it is now in the red_bottle. Therefore, the correct answer is option N, red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..07249aafa7bb593ede5afbfb2eeb44fdebd16b94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. 
+Question: Where does Benjamin think Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of Logan and Charlotte with respect to the potato and the red bottle. We know that Logan made no movements and stayed in the patio for 1 minute, while Charlotte moved the potato to the red bottle before exiting the patio. Therefore, Logan did not see Charlotte move the potato to the red bottle. + +Since Benjamin made no movements and stayed in the patio for 1 minute after Logan exited, he did not see Logan leave the patio. Therefore, he does not know that Logan did not see Charlotte move the potato to the red bottle. + +However, we know that Charlotte likes the red bottle, so it is possible that Benjamin thinks Logan thinks the potato is in the red bottle. Therefore, the answer is N. red_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..afac5cd586a3bba665251533078677661fbabd61 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Charlotte think Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to track the movements of each character and their interactions. Here are the steps: + +1. Logan, Charlotte, Hannah, Benjamin, and Evelyn entered the patio together. +2. The potato is in the green_envelope. +3. Charlotte likes the red_bottle. +4. Logan made no movements and stayed in the patio for 1 minute. +5. Logan exited the patio. +6. Charlotte moved the potato to the red_bottle. +7. Charlotte exited the patio. +8. Hannah made no movements and stayed in the patio for 1 minute. +9. Hannah exited the patio. +10. Benjamin made no movements and stayed in the patio for 1 minute. +11. Benjamin exited the patio. +12. Evelyn made no movements and stayed in the patio for 1 minute. +13. Evelyn exited the patio. +14. Logan, Charlotte, Hannah, Benjamin, and Evelyn entered the waiting_room together. + +Based on the assumption that agents tend to lie, we cannot trust what they say. Therefore, we need to infer their thoughts based on their actions and interactions. + +Charlotte moved the potato to the red_bottle, so she knows where the potato is. Logan made no movements and stayed in the patio for 1 minute, so he doesn't know where the potato is. Hannah, Benjamin, and Evelyn also made no movements and stayed in the patio for 1 minute, so they don't know where the potato is either. + +Charlotte likes the red_bottle, but we don't know if Benjamin knows this. Benjamin made no movements and stayed in the patio for 1 minute, so he didn't see Charlotte move the potato to the red_bottle. However, Charlotte exited the patio after moving the potato, so Benjamin could have seen her and inferred that the potato is in the red_bottle. 
+ +Logan exited the patio before Charlotte moved the potato, so he doesn't know where the potato is. However, Charlotte exited the patio after Logan, so Benjamin could have seen her and inferred that Logan doesn't know where the potato is. + +Based on the assumption that agents tend to trust a later-exiting agent, Benjamin may trust Charlotte's inference that Logan doesn't know where the potato is. Therefore, Benjamin may think that the potato is not in the green_pantry (where Logan may have put it), but rather in the red_container (where Charlotte moved it). + +Therefore, the answer is B. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d391b86f2b9292eaf07b4cbf0255ada36ede459 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. 
red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? + +2. We know that Charlotte moved the potato to the red_bottle, but we don't know if she told anyone about it. + +3. Logan made no movements and stayed in the patio for 1 minute, so he didn't move the potato. + +4. Benjamin made no movements and stayed in the patio for 1 minute, so he didn't move the potato either. + +5. Hannah made no movements and stayed in the patio for 1 minute, so she didn't move the potato. + +6. Evelyn made no movements and stayed in the patio for 1 minute, so she didn't move the potato either. + +7. Logan exited the patio first, followed by Charlotte, Hannah, Benjamin, and Evelyn. + +8. We know that Hannah and Charlotte were in the same place (the patio) at the same time, so they could have had a private or public interaction. + +9. We don't know if Benjamin and Charlotte were in the same place at the same time, so we can't assume that they had a private or public interaction. + +10. 
We don't know if Logan and Benjamin were in the same place at the same time, so we can't assume that they had a private or public interaction. + +11. We don't know if Logan and Charlotte were in the same place at the same time, so we can't assume that they had a private or public interaction. + +12. Hannah exited the patio after Charlotte, so she would tend to trust Charlotte more than Benjamin or Logan. + +13. Charlotte likes the red_bottle, but we don't know if she thinks the potato is in the red_bottle. + +14. Based on the information we have, we can't determine where Hannah thinks Charlotte thinks Benjamin thinks Logan thinks the potato is. + +Therefore, the answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c94bf13748dc607d99afad83b7be98f35784572 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where is the apple really? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. 
blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their statements. + +1. Hannah moved the apple from the green_bathtub to the blue_cupboard. +2. Jack moved the apple from the blue_cupboard to the green_drawer. +3. Lily moved the apple from the green_drawer to the red_box. + +Therefore, the apple is in the red_box. + +The answer is N. red_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9eea832f59f817d993132df8b349b9cac82a3a81 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. 
+5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Lily really think the apple is? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to track the movements of the apple and the agents in the story. We know that Hannah moved the apple from the green_bathtub to the blue_cupboard, and Jack then moved it to the green_drawer. Lily then moved the apple to the red_box. Logan and Aiden made no movements with the apple. Hannah likes the blue_drawer, but we don't have any information about Lily's preferences. 
+ +Based on the assumptions given, we can infer that Lily may have heard about the apple's location from Hannah or Jack before she moved it to the red_box. However, we don't know if she trusts their information or if she has her own thoughts about where the apple should be. + +The only definitive information we have is that the apple was last seen in the red_box when all the agents exited the closet and entered the waiting_room. Therefore, the answer to the question is N. red_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f159cdbe005e62dbc11e99407d1bcc77446d4583 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Hannah think Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. 
red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: The question is asking for Hannah's belief about Lily's belief regarding the location of the apple. To answer this question, we need to track the movements of the apple and the agents, and also consider their thoughts and potential interactions. + +1. Hannah, Jack, Lily, Logan, and Aiden entered the closet. +2. The apple is in the green_bathtub. +3. Hannah moved the apple to the blue_cupboard. +4. Hannah exited the closet. +5. Jack moved the apple to the green_drawer. +6. Jack exited the closet. +7. Lily moved the apple to the red_box. +8. Hannah likes the blue_drawer. +9. Lily exited the closet. +10. Logan made no movements and stayed in the closet for 1 minute. +11. Logan exited the closet. +12. Logan likes the green_pantry. +13. Aiden made no movements and stayed in the closet for 1 minute. +14. Aiden exited the closet. +15. Hannah, Jack, Lily, Logan, and Aiden entered the waiting_room. + +Based on the story and assumptions, we know that Hannah moved the apple to the blue_cupboard and likes the blue_drawer. Jack moved the apple to the green_drawer. Lily moved the apple to the red_box and then exited the closet. Logan made no movements and likes the green_pantry. Aiden made no movements and exited the closet after Logan. 
+ +Since Hannah and Lily were both in the closet and had potential interactions, Hannah can infer Lily's thought about the location of the apple. We need to track the movements of the apple to determine where Lily might think it is. + +The apple started in the green_bathtub, then moved to the blue_cupboard, then to the green_drawer, and finally to the red_box. Since Lily moved the apple to the red_box and then exited the closet, we can assume that she thinks the apple is in the red_box. + +However, we need to consider Hannah's belief about Lily's belief. Since Hannah likes the blue_drawer and moved the apple to the blue_cupboard, she might think that Lily also prefers blue locations. Therefore, Hannah might believe that Lily thinks the apple is in the blue_cupboard, even though it was moved to the red_box. + +Therefore, the answer is D. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dad34dd578dfbf5c3adb8a496a128c5f35c66bd4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. 
+15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Jack think Hannah thinks Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of the apple and the agents' preferences. We know that Hannah moved the apple to the blue_cupboard and likes the blue_drawer. Jack moved the apple to the green_drawer and exited the closet after Hannah. Lily moved the apple to the red_box and exited the closet after Jack. Therefore, Jack trusts Hannah more than Lily. Logan and Aiden made no movements and have no impact on the answer. + +Now, we need to determine where Jack thinks Hannah thinks Lily thinks the apple is. Since Jack trusts Hannah more than Lily, he will assume that Hannah's actions are more truthful than Lily's. Therefore, we need to look at where Hannah moved the apple to, which is the blue_cupboard. We also know that Hannah likes the blue_drawer. + +Therefore, Jack thinks that Hannah thinks Lily thinks the apple is in the blue_drawer (option D). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2b1b9489908ce5f92ed9b8e12488c9ad6c463dd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Aiden think Jack thinks Hannah thinks Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: The question is asking for Aiden's thoughts on Jack's thoughts on Hannah's thoughts on Lily's location of the apple. To solve this question, we need to trace the movements of the apple and the agents' preferences. + +1. The apple starts in the green_bathtub. +2. Hannah moves the apple to the blue_cupboard. +3. Jack moves the apple to the green_drawer. +4. Lily moves the apple to the red_box. + +From this, we can see that Lily has the apple in the red_box when she exits the closet. + +5. Hannah likes the blue_drawer. + +This information is not directly relevant to the location of the apple, but it tells us about Hannah's preference. + +6. Logan stays in the closet and makes no movements. + +Logan's actions are not relevant to the location of the apple. + +7. Aiden stays in the closet and makes no movements. + +Aiden's actions are not relevant to the location of the apple. + +8. All agents exit the closet in the order of Hannah, Jack, Lily, Logan, and Aiden. + +This information is important because it tells us the order in which the agents exited the closet. + +9. The agents enter the waiting_room. + +This information is not relevant to the location of the apple. + +Based on the movements of the apple and the agents' preferences, we can determine that Lily has the apple in the red_box when she exits the closet. We also know that Jack moved the apple to the green_drawer before Lily moved it to the red_box. + +Since Aiden made no movements and stayed in the closet for one minute, he would have seen Jack move the apple to the green_drawer. + +Therefore, Aiden would think that Jack thinks Hannah thinks the apple is in the green_drawer. 
+ +However, we are not given any information about where Lily thinks the apple is, so we cannot determine Aiden's thoughts on that. + +The answer is M. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8f1a80b78be6575a97f5f2116688fc90279135d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to follow the movements of each agent and their actions. Ella moved the spinach from the red_bottle to the green_basket. Benjamin then moved the spinach from the green_basket to the green_envelope. Therefore, the spinach is in the green_envelope. The answer is F. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4f4544c71dd27e8adada4d38dae1ab6c11c7658a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Emma really think the spinach is? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. 
green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to trace Emma's movements and any interactions she had with other agents. Emma entered the attic with Ella, Aiden, Jack, and Benjamin. She made no movements and stayed in the attic for 1 minute before exiting. We don't know if she had any private or public interactions with the other agents while in the attic. + +Next, we know that Benjamin moved the spinach to the green_envelope before exiting the attic. Aiden dislikes the turnip, but we don't know if he said anything about the spinach. Ella moved the spinach from the red_bottle to the green_basket before exiting the attic. Jack made no movements while in the attic. + +Finally, all five agents entered the waiting_room together. Based on the assumption that agents tend to trust those who exited the room later than themselves, Emma may trust Benjamin's claim that the spinach is in the green_envelope since he exited the attic after her. + +Therefore, the answer is F. green_envelope. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc288ef9750b03060ef3a50da03ac814b703e2ca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Ella think Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of Ella and Emma in relation to the spinach. Ella moved the spinach from the red_bottle to the green_basket, and then she exited the attic. Emma entered the attic after Ella had left, made no movements, and then exited the attic. Therefore, Ella did not witness Emma's actions in the attic. However, we know that Ella moved the spinach to the green_basket, so she likely thinks that the spinach is still in the green_basket. As for what Emma thinks, we cannot be sure since she did not move the spinach or have any interactions with it. Therefore, the answer is H. green_basket, which is where Ella thinks the spinach is, but we cannot determine where Emma thinks it is. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7637b27996725a30e887ee5e05949c5be63d999 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. 
+12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Aiden think Ella thinks Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: This question requires a lot of careful reading and tracking of each character's movements and statements. We know that Ella moved the spinach from the red bottle to the green basket, and Benjamin later moved it to the green envelope. Aiden made no movements and stayed in the attic for 1 minute, while Jack and Emma also stayed in the attic for 1 minute each. + +Based on the assumptions given, we know that Aiden can only infer Ella's thoughts if they were in the same place or had private/public interactions. We also know that agents tend to lie, so we can't trust what they say to each other. + +Since Aiden made no movements after Ella moved the spinach, he would not have seen where she put it. However, he knows that Benjamin moved it to the green envelope. 
We don't have any information about interactions between Aiden, Ella, and Emma, so we can't infer what Ella thinks Emma thinks about the spinach's location. + +Therefore, the answer is: we don't have enough information to answer this question. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..21888c2ba336b0a7eaa42c523abcd056cfbaedad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Benjamin think Aiden thinks Ella thinks Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: This is a complex question that requires careful analysis. We need to determine where Benjamin thinks Aiden thinks Ella thinks Emma thinks the spinach is. + +First, we need to establish the movements of each character and their thoughts about the spinach. Ella moved the spinach from the red_bottle to the green_basket. Aiden made no movements and we don't know his thoughts about the spinach. Jack made no movements and we don't know his thoughts about the spinach. Benjamin moved the spinach from the green_basket to the green_envelope. Emma made no movements and we don't know her thoughts about the spinach. + +Next, we need to consider the assumptions. We know that agents tend to lie, so we can't trust what they say about their thoughts. We also know that agents tend to trust those who exited the room later than themselves, so we can assume that Benjamin trusts Emma's movements and thoughts about the spinach. + +Based on these assumptions and the movements of the characters, we can eliminate some options. We know that the spinach was moved from the red_bottle to the green_basket by Ella, so it can't be in the red_crate, red_drawer, green_drawer, green_treasure_chest, green_bathtub, blue_bucket, blue_bottle, blue_cupboard, red_pantry, red_envelope, or green_box. + +We also know that Benjamin moved the spinach from the green_basket to the green_envelope, so it can't be in the green_basket. + +Therefore, the only option left is F. green_envelope. 
Benjamin thinks that Aiden thinks Ella thinks Emma thinks the spinach is in the green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4575e444fc61be71cb4807396ff93f2196b0eaeb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where is the corn really? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to follow the movements of each agent and their actions. According to the story, the corn was initially in the green_crate. Sophia moved the corn to the blue_suitcase before exiting the crawlspace. Therefore, the correct answer is J. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b895e781bc82ca069469d2257fed7c5d17b81dc8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Sophia really think the corn is? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. 
green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: The question is asking where Sophia really thinks the corn is. Based on the story and assumptions, we know that Sophia moved the corn to the blue_suitcase before exiting the crawlspace. However, we also know that every agent tends to lie and that their public claims may not reflect their actual thoughts. Therefore, we cannot trust Sophia's claim that the corn is in the blue_suitcase. We also cannot infer Sophia's thoughts based on the actions or claims of other agents who were not in the same place as her. + +Therefore, the answer to the question is J. blue_suitcase, as that is the only location we know for certain that the corn was moved to by Sophia. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee2cb780910e48811dbeeca2b8117d1932bd118d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Chloe think Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: The question is asking for Chloe's thoughts about Sophia's thoughts on the location of the corn. To answer this question, we need to track the movements of each character and their interactions with each other. + +1. 
Owen, Ella, Chloe, Sophia, and Noah entered the crawlspace. +2. The corn is in the green_crate. +3. Owen made no movements and stayed in the crawlspace for 1 minute. +4. Owen exited the crawlspace. +5. Ella made no movements and stayed in the crawlspace for 1 minute. +6. Ella exited the crawlspace. +7. Chloe made no movements and stayed in the crawlspace for 1 minute. +8. Ella dislikes the corn. +9. Chloe exited the crawlspace. +10. Sophia moved the corn to the blue_suitcase. +11. Sophia exited the crawlspace. +12. Noah made no movements and stayed in the crawlspace for 1 minute. +13. Noah exited the crawlspace. +14. Owen, Ella, Chloe, Sophia, and Noah entered the waiting_room. + +Based on the story and assumptions, we know that Chloe made no movements in the crawlspace and stayed there for one minute. We also know that Sophia moved the corn to the blue_suitcase before exiting the crawlspace. + +Since Chloe and Sophia were both in the crawlspace, Chloe could have inferred Sophia's thoughts on the location of the corn. However, we do not have any information about their private or public interactions. + +Therefore, we cannot determine where Chloe thinks Sophia thinks the corn is located. The answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..80ddf2ffe43a8d816475904fddf3fabb9545aa10 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. 
+4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Ella think Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: This question requires a lot of inference based on the given assumptions. We know that Ella dislikes the corn and that Sophia moved it to the blue_suitcase. We also know that Chloe made no movements and stayed in the crawlspace for 1 minute. Therefore, we can assume that Chloe did not move the corn and may not know where it is currently located. + +Since Ella and Chloe were both in the crawlspace together, Ella may have overheard Chloe's thoughts or they may have had a private interaction. 
However, we cannot be sure if Chloe actually knows where the corn is. + +Therefore, we need to focus on where Sophia thinks the corn is located. We know that Sophia moved the corn to the blue_suitcase and that Noah was the last one to exit the crawlspace before the group entered the waiting_room. Since agents tend to trust those who exit a room later than themselves, we can assume that Sophia's claim about the corn being in the blue_suitcase is true. + +Therefore, Ella may think that Chloe thinks Sophia thinks the corn is in the blue_suitcase. The answer is J. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..882928c295960621a29b4dd8ae1fc09a540032e4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Owen think Ella thinks Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. 
red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. Let's break it down step by step: + +1. Owen and the rest of the group entered the crawlspace. +2. The corn is in the green_crate. +3. Owen made no movements and stayed in the crawlspace for 1 minute. +4. Owen exited the crawlspace. +5. Ella made no movements and stayed in the crawlspace for 1 minute. +6. Ella exited the crawlspace. +7. Chloe made no movements and stayed in the crawlspace for 1 minute. +8. Ella dislikes the corn. +9. Chloe exited the crawlspace. +10. Sophia moved the corn to the blue_suitcase. +11. Sophia exited the crawlspace. +12. Noah made no movements and stayed in the crawlspace for 1 minute. +13. Noah exited the crawlspace. +14. Owen, Ella, Chloe, Sophia, and Noah entered the waiting_room. + +Based on the assumptions given, we know that Owen can only infer what Ella thinks if they were in the same place or had private or public interactions. We also know that Ella dislikes the corn, but we don't know if she shared this information with Owen. + +Chloe made no movements and stayed in the crawlspace for 1 minute, so we don't know what she thinks about the corn. 
Sophia moved the corn to the blue_suitcase, so we know that she thinks the corn is in the blue_suitcase. + +Noah made no movements and stayed in the crawlspace for 1 minute, so we don't know what he thinks about the corn either. + +Since we don't have any information about what Ella thinks about the corn, we can't infer what Chloe or Sophia think about it either. Therefore, we can't determine where Owen thinks Ella thinks Chloe thinks Sophia thinks the corn is. + +The answer is none of the above (N/A). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..90be1f78406295a6c6d6f12311a21091d70a3a5a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where is the banana really? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. 
red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their actions related to the banana. From the story, we know that the banana was initially in the green_envelope, then Abigail moved it to the blue_bottle, and finally, Owen moved it back to the green_envelope. Therefore, the correct answer is G. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..765f1ad76d98317ad2ef1d28c87a06eb717d6e7c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. 
+9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Abigail really think the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: To answer this question, we need to look at the movements of each agent and their possible interactions with each other. We know that Abigail moved the banana to the blue_bottle before exiting the bedroom. We also know that Owen later moved the banana back to the green_envelope before all agents entered the waiting_room. Based on the assumption that agents tend to lie, we cannot trust Abigail's claim that she likes the red_pantry. However, we can use the assumption that an agent tends to trust an agent that exited the room later than themselves. Since Owen exited the bedroom after Abigail, he may have seen where she moved the banana and could have informed her of his actions. 
Therefore, Abigail may actually think that the banana is in the green_envelope, where Owen left it. The answer is G. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2ab46d8d35d53aefa5e9a75b0c413138c26fc477 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Ella think Abigail thinks the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: To answer this question, we need to track the movements of each agent and the location of the banana. From the story, we know that Elizabeth, Ava, Abigail, Ella, and Owen entered the bedroom. The banana was initially in the green_envelope. Elizabeth made no movements and stayed in the bedroom for 1 minute before exiting. Ava also made no movements and stayed in the bedroom for 1 minute before exiting. Abigail moved the banana to the blue_bottle before exiting. Ella made no movements and stayed in the bedroom for 1 minute before exiting. Owen saw a cat and then moved the banana back to the green_envelope before exiting. Finally, all five agents entered the waiting_room. + +Since Ella never moved the banana or saw anyone else move it, she cannot know for sure where the banana is. However, she can infer where Abigail thinks the banana is based on the assumption that agents tend to trust those who exited the room later than themselves. From the story, we know that Abigail exited the bedroom before Owen did. Therefore, Ella would likely think that Abigail thinks the banana is in the blue_bottle, where Abigail left it before exiting the bedroom. + +Therefore, the answer is F. blue_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..58f44b8efdcbe36268f9b9290d43a8e69a4f95f2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Elizabeth think Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of each agent and the location of the banana. From the story, we know that the banana was initially in the green_envelope, then Abigail moved it to the blue_bottle, and finally, Owen moved it back to the green_envelope. Elizabeth was in the bedroom with the banana and made no movements, so she knows the banana was initially in the green_envelope. Ella also made no movements and stayed in the bedroom, so she knows the banana was in the green_envelope as well. Abigail moved the banana to the blue_bottle, but we don't know if Ella was present when this happened. Therefore, we cannot infer where Ella thinks Abigail thinks the banana is. Elizabeth only knows that the banana was initially in the green_envelope, so she cannot provide any insight into where Ella thinks Abigail thinks the banana is. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..597c5b1b77958b6b70eb84640f6be86f96deea73 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. 
+6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Owen think Elizabeth thinks Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their interactions with each other. From the story, we know that Elizabeth and Ava did not move the banana, Abigail moved it to the blue_bottle, Ella did not move it, and Owen moved it to the green_envelope. We also know that Owen saw a cat and Elizabeth stayed in the bedroom for 1 minute before exiting. + +Based on the assumptions given, we can infer that Owen trusts Elizabeth's judgment more than his own since she exited the bedroom after him. 
Therefore, Owen thinks that Elizabeth thinks the banana is in the green_envelope. + +However, the question asks where Owen thinks Elizabeth thinks Ella thinks Abigail thinks the banana is. Since Ella did not move the banana, we can assume that Owen thinks Ella has no opinion on where the banana is. Abigail moved the banana to the blue_bottle, so Owen thinks that Abigail thinks the banana is in the blue_bottle. + +Therefore, the answer to the question is B. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d3b5692d788275c5e13fd87ee0a12bcabee0b31 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. 
+20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where is the cucumber really? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their interactions with the cucumber. According to the story, the cucumber was initially in the green_treasure_chest when all five agents entered the dining_room. Ava made no movements and left after a minute, while Evelyn moved the cucumber to the red_envelope and left. Charlotte then moved the cucumber to the red_crate and left. William made no movements and left after a minute, and finally, Jacob moved the cucumber back to the green_treasure_chest before all five agents left for the waiting_room. Therefore, the correct answer is G. green_treasure_chest. 
+ +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e885f1365f16540d76def2452930bc0ede329117 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the cucumber is? +Answer: red_envelope +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. 
red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the cucumber and the agents. According to the story, the cucumber was initially in the green_treasure_chest, then moved to the red_envelope by Evelyn, then to the red_crate by Charlotte, and finally back to the green_treasure_chest by Jacob. Ava and William made no movements and stayed in the dining_room for 1 minute each. + +Evelyn was the one who moved the cucumber to the red_envelope, so she knows it's not there anymore. Charlotte moved it to the red_crate, so she also knows it's not in the red_envelope. Jacob moved it back to the green_treasure_chest, so he knows where it is. Ava and William didn't move the cucumber, so they may or may not know where it is. + +Based on the assumptions given, we know that agents tend to lie, so we can't trust what they say. We also know that an agent tends to trust another agent who exited the room later than themselves. + +Evelyn exited the dining_room before Charlotte and Jacob, so she may not trust their claims about the cucumber's location. However, she may trust Ava and William's claims if they say anything about it. + +Therefore, we can't determine where Evelyn really thinks the cucumber is based on the information given. The answer is not provided in the multiple-choice options. 
+ +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..975ad24d52fcf5dc2b7976b1693f5848952c72ac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Ava think Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. 
green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: The question is asking about Ava's thoughts regarding where Evelyn thinks the cucumber is. To answer this question, we need to trace the movements of Ava and Evelyn in relation to the cucumber. + +1. Ava, Evelyn, Charlotte, William, and Jacob entered the dining room. +2. The cucumber is in the green treasure chest. +3. Ava made no movements and stayed in the dining room for 1 minute. +4. Ava exited the dining room. +5. Evelyn moved the cucumber to the red envelope. + +Based on the assumption that an agent can only infer another agent's thoughts if they have been in the same place or have had private or public interactions, Ava would not know where Evelyn thinks the cucumber is because she did not witness Evelyn's movements with the cucumber. + +Therefore, the answer is none of the above options. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a959ab8fcc6afbcae7f70fa2127f5f975bb6f03c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Charlotte think Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of Ava, Evelyn, and Charlotte regarding the cucumber. According to the story, Ava did not move the cucumber, and she left the dining room before anyone else moved it. Evelyn moved the cucumber to the red envelope, and Charlotte moved it to the red crate. Therefore, Charlotte knows that the cucumber is not in the green treasure chest where it originally was, and it is not in the red envelope where Evelyn moved it. Charlotte also knows that William did not move the cucumber, and Jacob moved it back to the green treasure chest after Charlotte moved it to the red crate. However, we do not have any information about what Ava thinks about the cucumber's location. + +Now, we need to determine where Charlotte thinks Ava thinks Evelyn thinks the cucumber is. Since Charlotte knows that the cucumber is not in the green treasure chest or the red envelope, she can eliminate options D, G, and F. Charlotte also knows that Jacob moved the cucumber to the green treasure chest after she moved it to the red crate, so she can eliminate option I. The watermelon is not relevant to this question, so we can eliminate all options related to it (J, K, M, and N). + +Therefore, the possible options are A, C, E, H, and O. Since we do not have any information about what Ava thinks about the cucumber's location, we cannot eliminate any of these options based on Ava's thoughts. However, we know that Charlotte moved the cucumber to the red crate, and she trusts Jacob more than Evelyn because Jacob exited the pantry after Evelyn. Therefore, Charlotte might think that Evelyn thinks the cucumber is in the green cupboard (option C) because Jacob moved the cucumber to the green treasure chest after Charlotte moved it to the red crate. 
+ +Therefore, the answer is C. Green cupboard. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e01ea582e2e4f99d7879a242f3b193f2702b5c12 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Jacob think Charlotte thinks Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. 
red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. We need to determine where Jacob thinks Charlotte thinks Ava thinks Evelyn thinks the cucumber is. + +Step 1: Determine where the cucumber actually is. According to the story, the cucumber is in the green_treasure_chest (option G). + +Step 2: Determine who moved the cucumber and where they moved it to. Evelyn moved the cucumber to the red_envelope (option F), and then Charlotte moved it to the red_crate (option I). + +Step 3: Determine who was in the dining_room when the cucumber was moved. Ava and William made no movements and stayed in the dining_room for 1 minute each, while Evelyn and Charlotte both moved the cucumber. Jacob moved the cucumber after everyone else had left the dining_room. + +Step 4: Determine who had interactions with whom. Ava made no movements and stayed in the dining_room for 1 minute, so she did not interact with anyone. Evelyn moved the cucumber to the red_envelope, so she knows where it is. Charlotte moved the cucumber to the red_crate, so she also knows where it is. William made no movements and stayed in the dining_room for 1 minute, so he did not interact with anyone. 
Jacob moved the cucumber to the green_treasure_chest, so he knows where it is. + +Step 5: Determine who trusts whom. According to the assumption, an agent tends to trust an agent that exited the room later than himself. Therefore, Jacob trusts Charlotte, Charlotte trusts Evelyn, and Evelyn trusts Ava. + +Step 6: Determine where Jacob thinks Charlotte thinks Ava thinks Evelyn thinks the cucumber is. Since Jacob trusts Charlotte, he will assume that Charlotte knows where the cucumber is. Since Charlotte trusts Evelyn, she will assume that Evelyn knows where the cucumber is. Since Evelyn trusts Ava, she will assume that Ava knows where the cucumber is. However, Ava did not interact with anyone who moved the cucumber, so she does not know where it is. Therefore, Jacob will think that Charlotte thinks Ava thinks Evelyn thinks the cucumber is in the red_crate (option I), since that was the last place Charlotte moved it to before leaving the dining_room. + +Answer: I. red_crate. + +a: 5 6 7 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..97248c69d329a1d0253eed5e3efcb1c568b2a4ae --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. 
+9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where is the orange really? +Answer: red_container +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To solve this question, we need to track the movements of each agent and the location of the orange. According to the story, Hannah, Jack, Alexander, Chloe, and Aiden entered the master_bedroom. Hannah made no movements and stayed in the master_bedroom for 1 minute before exiting. Jack moved the orange to the blue_treasure_chest and then exited. 
Alexander made no movements and stayed in the master_bedroom for 1 minute before exiting. Chloe moved the orange to the red_container and then exited. Aiden made no movements and stayed in the master_bedroom for 1 minute before exiting. Therefore, the orange is in the red_container. + +The answer is A. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..199d74430a840b8ef6e4ae744a9dda9c6f675136 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. 
+Question: Where does Hannah really think the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the orange and who moved it. According to the story, the orange was initially in the red_pantry, then Jack moved it to the blue_treasure_chest, and finally Chloe moved it to the red_container. Hannah made no movements with the orange. However, we cannot assume that Hannah's thoughts match her actions, as the agents tend to lie. We also cannot infer her thoughts based on private or public interactions, as there is no mention of any such interactions involving Hannah and the orange. Therefore, we need to consider the exit order of the agents. Aiden exited the front yard last, followed by Hannah and Jack. As per the assumption, agents tend to trust an agent that exited the room later than themselves. Therefore, Hannah may trust Aiden's exit order and believe that the orange is in the green_pantry, where Aiden moved the pear. Therefore, the answer is J. green_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ab909259171e24682fda52ec2458c5317964ee7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Aiden think Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. 
green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the orange and the agents. First, Hannah, Jack, Alexander, Chloe, and Aiden entered the master_bedroom. Then, the orange was in the red_pantry. Hannah made no movements and stayed in the master_bedroom for 1 minute before exiting. Jack moved the orange to the blue_treasure_chest and then exited. Alexander made no movements and stayed in the master_bedroom for 1 minute before exiting. Chloe moved the orange to the red_container and then exited. Aiden made no movements and stayed in the master_bedroom for 1 minute before exiting. + +Next, Aiden, Hannah, and Jack entered the front_yard. The pear was in the red_box. Aiden moved the pear to the green_pantry and then exited. Hannah moved the pear to the green_envelope and then exited. Jack made no movements and stayed in the front_yard for 1 minute before exiting. Finally, Aiden, Hannah, and Jack entered the waiting_room. + +Based on the assumption that agents tend to lie, we cannot trust what any of the agents say about the location of the orange. However, we can infer where Aiden thinks Hannah thinks the orange is based on their movements. Aiden was the last to exit the master_bedroom, so he would tend to trust the agents who exited after him more than those who exited before him. 
Chloe was the last to move the orange, so Aiden would tend to trust her more than Jack or Alexander. Chloe moved the orange to the red_container, so Aiden would think that Hannah thinks the orange is in the red_container. + +Therefore, the answer is A. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..188fca4d55178656acfc985dcddc9e03f23abd6f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Jack think Aiden thinks Hannah thinks the orange is? 
+Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Jack think Aiden thinks Hannah thinks the orange is? + +2. We know that the orange was initially in the red_pantry, but was moved by Jack to the blue_treasure_chest and then by Chloe to the red_container. + +3. Hannah made no movements and stayed in the master_bedroom for 1 minute, so she did not move the orange. + +4. Aiden was not present when the orange was moved, but he did move the pear from the red_box to the green_pantry. + +5. Jack made no movements in the waiting_room or front_yard, but he did move the orange to the blue_treasure_chest. + +6. Based on the assumptions, we know that Jack tends to trust Aiden more than Hannah because Aiden exited the master_bedroom after Jack did. + +7. However, we do not know what Aiden thinks about the location of the orange, as he did not witness its movements. + +8. 
Therefore, we need to consider what information Aiden could have inferred from his interactions with the other agents. + +9. Aiden and Hannah were both in the front_yard, where the pear was moved from the red_box to the green_pantry. + +10. Hannah moved the pear to the green_envelope before exiting the front_yard. + +11. Therefore, Aiden could infer that Hannah knew the location of the pear and may have some knowledge about the location of the orange. + +12. However, we do not know if Aiden actually communicated with Hannah about the orange. + +13. Based on these observations, we can eliminate options that do not make sense based on the movements of the agents and the location of the orange and pear. + +14. We can also eliminate options that rely on Aiden's direct knowledge of the orange's location, as he did not witness its movements. + +15. Therefore, the most likely answer is that Jack thinks Aiden thinks Hannah thinks the orange is in the red_container, as this is the location where the orange was last seen before Aiden entered the waiting_room. + +16. However, it is important to note that this answer is based on assumptions and inferences, and may not be the correct answer if the agents were lying or had different thought processes than expected. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..79ad7352409040f266eb76ac932c71ccaad239fb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1,66 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. 
+3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? + +2. We know that the orange was initially in the red_pantry (step 2). + +3. Hannah did not move the orange (step 3), so she does not have any thoughts about where it is. + +4. Jack moved the orange to the blue_treasure_chest (step 5). + +5. Alexander did not move the orange (step 7), but he knows that Jack moved it to the blue_treasure_chest. + +6. Chloe moved the orange to the red_container (step 9), but Alexander did not witness this. + +7. Aiden did not move the orange (step 11), but he knows that Chloe moved it to the red_container (step 9). + +8. Aiden, Hannah, and Jack later moved to the front_yard (step 14). + +9. The pear was initially in the red_box (step 15). + +10. Aiden moved the pear to the green_pantry (step 16). + +11. Hannah moved the pear to the green_envelope (step 18). + +12. Jack did not move the pear (step 20). + +Based on these steps, we can infer that: + +- Alexander knows that Jack moved the orange to the blue_treasure_chest. +- Aiden knows that Chloe moved the orange to the red_container. +- Hannah knows where the pear is (in the green_envelope). +- Jack does not have any thoughts about where the orange or pear is. + +So, where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? We know that Alexander knows that Jack moved the orange to the blue_treasure_chest, but we don't know what Aiden or Hannah think about the orange's location. Therefore, we cannot determine where Alexander thinks Jack thinks Aiden thinks Hannah thinks the orange is. + +The answer is: Cannot be determined. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9fff14d37c5820f32c206ed50b0586da748634c1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to follow the movements of the agents and determine where the cherry ended up. Emily moved the cherry to the red_container, and then exited the pantry. Lily made no movements and stayed in the pantry for 1 minute before exiting. Emma then moved the cherry to the green_envelope before exiting the pantry. Avery then moved the cherry to the blue_suitcase before exiting the pantry. Finally, Ella made no movements and stayed in the pantry for 1 minute before exiting. + +Based on this information, we know that the cherry was last seen in the blue_suitcase, as that is where Avery placed it before exiting the pantry. Therefore, the answer is H. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..95c86284b22829c4701901fb145810f98a8c366c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. 
+3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Avery really think the cherry is? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: The question is asking for where Avery really thinks the cherry is. 
To answer this question, we need to track the movements of the cherry and who interacted with it. + +1. Emily moved the cherry to the red_container. +2. Lily made no movements and stayed in the pantry for 1 minute. +3. Emma moved the cherry to the green_envelope. +4. Avery moved the cherry to the blue_suitcase. + +Based on the assumptions given, we know that Avery can only infer Lily's thoughts if they were in the same place or had private/public interactions. However, Lily made no movements and stayed in the pantry for 1 minute, so Avery cannot infer her thoughts. + +Therefore, Avery's belief about the location of the cherry can only be based on his own interactions with it. The last interaction with the cherry was when Avery moved it to the blue_suitcase. Therefore, Avery really thinks the cherry is in the blue_suitcase. + +The answer is H. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..26bfbafc25483cb7c4be888a691e5c5f172fd2b2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. 
+13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Lily think Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of Lily and Avery and their interactions. Lily entered the pantry with Emily, Emma, Avery, and Ella. She made no movements and stayed in the pantry for 1 minute before exiting. Avery moved the cherry to the blue_suitcase before exiting the pantry. Later, Lily, Avery, and Ella entered the cellar where Avery moved the tomato to the red_bucket. Lily likes the red_drawer. 
+ +Based on the assumptions, we know that Lily can only infer Avery's thought if they have been in the same place or have private or public interactions. Lily and Avery were both in the pantry, but there is no evidence of any interaction between them. Therefore, Lily cannot infer Avery's thought about the cherry based on their time in the pantry. + +In the cellar, Avery moved the tomato to the red_bucket, which may give Lily a clue about Avery's thought process. However, there is no evidence of any interaction between Lily and Avery in the cellar. Therefore, Lily cannot infer Avery's thought about the cherry based on their time in the cellar. + +Since Lily likes the red_drawer and Avery moved the cherry to the blue_suitcase, it is unlikely that Lily would think Avery thinks the cherry is in the blue_suitcase. Therefore, we can eliminate option H. + +Based on the movements of the agents and the assumptions, the only logical answer is F. Lily thinks Avery thinks the cherry is in the red_container because that is where Emily moved the cherry before exiting the pantry, and Avery did not move the cherry to a different location before exiting the pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f87b0692fb461f81646cb0738788e55dcbb03cdb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. 
+7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Ella think Lily thinks Avery thinks the cherry is? + +2. 
To answer this question, we need to start with the cherry's location. According to the story, the cherry was initially in the red_drawer, but Emily moved it to the red_container. Later, Emma moved it to the green_envelope, and Avery moved it to the blue_suitcase. None of the agents moved the cherry again after that. + +3. Next, we need to consider Lily's movements. She entered the pantry with Emily, Emma, Avery, and Ella, but made no movements and stayed there for 1 minute. She then exited the pantry and later entered the cellar with Avery and Ella. She made no movements in the cellar and stayed there for 1 minute before exiting with Avery and Ella. + +4. We also need to consider Avery's movements, as Ella's thoughts about Lily's thoughts are based on what Avery thinks. Avery entered the pantry with Emily, Lily, Emma, and Ella, and moved the cherry to the blue_suitcase before exiting. Later, she entered the cellar with Lily and Ella, and moved the tomato to the red_bucket before exiting with Lily and Ella. + +5. Based on these movements, we can eliminate several options for where Ella thinks Lily thinks Avery thinks the cherry is. For example, we know that the cherry is not in the green_bucket, red_crate, green_bathtub, blue_treasure_chest, blue_pantry, red_basket, blue_crate, or blue_cupboard, as none of the agents moved the cherry to those locations. + +6. We can also eliminate some options based on Lily's movements. Since Lily made no movements in the pantry, she could not have seen where Emily moved the cherry to. Therefore, she could not have known that the cherry was in the red_container. Similarly, since Lily made no movements in the cellar before Avery moved the tomato to the red_bucket, she could not have seen where the cherry was moved to by Avery. + +7. This leaves us with two options: red_drawer and red_container. Since Lily likes the red_drawer (according to assumption 3), it is possible that she thinks Avery thinks the cherry is there. 
However, since Avery moved the cherry to the blue_suitcase before exiting the pantry, it is also possible that Lily thinks Avery thinks the cherry is in the red_container. + +8. Finally, we need to consider where Ella thinks Lily thinks Avery thinks the cherry is. Since Ella made no movements in either the pantry or the cellar, she could not have seen where the cherry was moved to. Therefore, her thoughts about where Lily thinks Avery thinks the cherry is are based on her assumptions about Lily's thought process. + +9. Based on assumption 4, Ella would tend to trust Avery's thoughts about the cherry's location, since Avery exited the pantry after Lily did. Therefore, it is likely that Ella thinks Lily thinks Avery thinks the cherry is in the red_container, since that is where Avery moved it to before exiting the pantry. + +10. Therefore, the answer to the question is F. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c42717e5ee5cd28006f61bbefcaf3f10c0e85de6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. 
+13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? + +2. To answer this question, we need to start with the cherry's location. According to the story, the cherry was initially in the red_drawer, but Emily moved it to the red_container. + +3. Next, we need to determine who knows about the cherry's location. 
Emily, Lily, Emma, Avery, and Ella were all in the pantry when the cherry was moved, so they all know that it was moved from the red_drawer to the red_container. + +4. Lily and Ella did not make any movements in the pantry, so they did not move the cherry or witness anyone else moving it. + +5. Emma moved the cherry from the red_container to the green_envelope, and Avery moved it from the green_envelope to the blue_suitcase. + +6. Based on the assumption that agents tend to trust those who exited a room later than themselves, we can assume that Avery trusts Ella's knowledge of the cherry's location more than Lily's knowledge. + +7. Therefore, we need to determine where Ella thinks Avery thinks the cherry is. Avery moved the cherry to the blue_suitcase, so Ella knows that the cherry is in the blue_suitcase. + +8. We also need to determine where Lily thinks Avery thinks the cherry is. Lily did not witness Avery moving the cherry, but she knows that Ella stayed in the cellar with Avery after Lily left. Therefore, Lily may assume that Avery moved the cherry to the same location as Ella (the blue_suitcase). + +9. Finally, we need to determine where Emily thinks Ella thinks Lily thinks Avery thinks the cherry is. Emily knows that the cherry was moved from the red_drawer to the red_container, but she did not witness any of the subsequent movements. Therefore, she may assume that the cherry is still in the red_container. + +10. However, Emily also knows that Avery moved the tomato to the red_bucket in the cellar, and that Lily likes the red_drawer. Therefore, she may also assume that Lily thinks the cherry is in the red_drawer. + +11. Based on these assumptions, we can conclude that Emily may think that Ella thinks Lily thinks Avery thinks the cherry is either in the blue_suitcase or the red_drawer. + +12. Therefore, the answer to the question is either H. blue_suitcase or G. red_drawer. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae30003725d46e162cf7b43e131955769c8ba6c1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where is the pear really? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their actions. According to the story, the pear was initially in the red_box in the pantry. Charlotte moved the pear to the red_bucket before exiting the pantry. None of the other agents made any movements towards the pear. Therefore, the pear is in the red_bucket. The correct answer is M. red_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cafb1c31ca32509190f0bcd8947a96c3e036b14f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. 
+9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Charlotte really think the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track Charlotte's movements and any interactions she had with other agents. According to the story, Charlotte moved the pear to the red_bucket in the pantry, but later moved the asparagus to the red_pantry in the office. 
There is no mention of Charlotte interacting with any other agents about the location of the pear. Therefore, based on the given information, Charlotte really thinks the pear is in the M. red_bucket. The answer is M. red_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..358d2eb6919a42c5a99fb33b1e8ce529b06a780d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Alexander think Charlotte thinks the pear is? 
+Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track the movements of Alexander and Charlotte and their interactions. We know that Alexander, Charlotte, and Ava entered the office together, and Alexander moved the asparagus to the red_drawer. Then Charlotte moved the asparagus to the red_pantry before exiting the office. We don't have any information about their private or public interactions regarding the location of the pear. However, we know that the pear is in the red_box, which was the initial location when all five agents entered the pantry. Therefore, Alexander should think that Charlotte thinks the pear is in the red_box. The answer is L. red_box. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..51d44dbaf7a502f3ce91d8d5f8ec9b65bb723ffd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Ava think Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. 
blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: The question is asking for Ava's thoughts about Alexander's thoughts about Charlotte's thoughts on the location of the pear. To answer this question, we need to track the movements of each agent and their interactions with each other. + +1. William, Ava, Charlotte, Avery, and Alexander entered the pantry. +2. The pear is in the red_box. +3. William made no movements and stayed in the pantry for 1 minute. +4. William exited the pantry. +5. Ava made no movements and stayed in the pantry for 1 minute. +6. Ava exited the pantry. +7. Charlotte moved the pear to the red_bucket. +8. Charlotte exited the pantry. +9. Avery made no movements and stayed in the pantry for 1 minute. +10. Avery exited the pantry. +11. Alexander made no movements and stayed in the pantry for 1 minute. +12. Alexander exited the pantry. +13. William, Ava, Charlotte, Avery, and Alexander entered the waiting_room. +14. Alexander, Charlotte, and Ava entered the office. +15. The asparagus is in the red_basket. +16. Alexander moved the asparagus to the red_drawer. +17. Avery dislikes the pear. +18. Alexander exited the office. +19. Charlotte moved the asparagus to the red_pantry. +20. Charlotte exited the office. +21. Avery dislikes the cabbage. +22. Ava made no movements and stayed in the office for 1 minute. +23. Ava exited the office. 
+24. Alexander, Charlotte, and Ava entered the waiting_room. + +Based on the story, Ava and Alexander were both in the office together, but there is no mention of them having any private or public interactions. Therefore, Ava cannot infer Alexander's thoughts about Charlotte's thoughts on the location of the pear. + +The location of the pear was last mentioned in step 8, where Charlotte moved it to the red_bucket. There is no mention of Charlotte moving the pear again or anyone else moving it. Therefore, the answer is M. red_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..22d6685c525abf9f64f743b8b8ecf04e43d77ff9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1,97 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. 
+20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? + +2. We know that the pear is in the red_box (step 2). + +3. William made no movements and stayed in the pantry for 1 minute (step 3). + +4. William exited the pantry (step 4). + +5. Ava made no movements and stayed in the pantry for 1 minute (step 5). + +6. Ava exited the pantry (step 6). + +7. Charlotte moved the pear to the red_bucket (step 7). + +8. Charlotte exited the pantry (step 8). + +9. Avery made no movements and stayed in the pantry for 1 minute (step 9). + +10. Avery exited the pantry (step 10). + +11. 
Alexander made no movements and stayed in the pantry for 1 minute (step 11). + +12. Alexander exited the pantry (step 12). + +13. William, Ava, Charlotte, Avery and Alexander entered the waiting_room (step 13). + +14. Alexander, Charlotte and Ava entered the office (step 14). + +15. The asparagus is in the red_basket (step 15). + +16. Alexander moved the asparagus to the red_drawer (step 16). + +17. Avery dislikes the pear (step 17). + +18. Alexander exited the office (step 18). + +19. Charlotte moved the asparagus to the red_pantry (step 19). + +20. Charlotte exited the office (step 20). + +21. Avery dislikes the cabbage (step 21). + +22. Ava made no movements and stayed in the office for 1 minute (step 22). + +23. Ava exited the office (step 23). + +24. Alexander, Charlotte and Ava entered the waiting_room (step 24). + +Based on these steps, we can infer that: + +- William was in the pantry when the pear was in the red_box, but he made no movements and did not witness Charlotte moving the pear to the red_bucket. +- Ava was also in the pantry when the pear was in the red_box, but she made no movements and did not witness Charlotte moving the pear to the red_bucket. +- Alexander was in the pantry when the pear was in the red_box, but he made no movements and did not witness Charlotte moving the pear to the red_bucket. +- Charlotte moved the pear from the red_box to the red_bucket, but we don't know what she thinks about where the pear is. +- Avery dislikes the pear, but we don't know where he thinks it is. +- The asparagus is in the red_basket, but we don't know what William, Ava, or Charlotte think about where it is. +- Alexander moved the asparagus to the red_drawer, but we don't know what William, Ava, or Charlotte think about where it is. +- Charlotte moved the asparagus to the red_pantry, but we don't know what William, Ava, or Alexander think about where it is. +- Ava was in the office for 1 minute, but we don't know what she did or saw. 
+- Alexander, Charlotte, and Ava were in the office together, but we don't know what they discussed or what they think about where the pear or asparagus is. +- William, Ava, Charlotte, Avery, and Alexander were all in the waiting_room together, but we don't know what they think about where the pear or asparagus is. + +Given all of this information, we cannot determine where William thinks Ava thinks Alexander thinks Charlotte thinks the pear is. The question is too complex and there is not enough information to make a definitive answer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..16d08c19a10a0065befbdc4509b53ca7e422d0bb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. 
+20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their statements. According to the story, Avery made no movements in the workshop and dislikes the tomato. Sophia moved the watermelon to the green_envelope and then exited the workshop. Carter moved the watermelon to the green_basket and then exited the workshop. Therefore, the watermelon could be in either the green_envelope or the green_basket. However, we need to consider the exit order as well. Carter exited the workshop after Sophia, so we can trust his statement more than Sophia's. Therefore, the watermelon is most likely in the green_basket. The answer is D. green_basket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f8cbad2fd65e4bbe7a144830c7f25a9acd4980c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Carter really think the watermelon is? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. 
blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of the watermelon and Carter's movements. According to the story, the watermelon was initially in the blue_suitcase, then Sophia moved it to the green_envelope, and finally, Carter moved it to the green_basket. Carter exited the workshop after moving the watermelon to the green_basket. Since Carter exited the workshop after Avery, he tends to trust Avery's claim that he dislikes the tomato. Therefore, we can assume that Carter did not move the watermelon to the red_envelope, blue_bucket, green_cupboard, blue_treasure_chest, green_crate, red_drawer, green_drawer, green_treasure_chest, green_bathtub, red_bottle, or blue_pantry. The only option left is the green_basket, which is where Carter really thinks the watermelon is. Therefore, the answer is D. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..965a7cfb72ac79f7ec7932e6e95c5f81f2223b46 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Avery think Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track Avery's movements and statements, as well as Carter's movements. Avery entered the workshop with Sophia, Carter, Emily, and Isla. Avery made no movements and stayed in the workshop for 1 minute before exiting. Sophia moved the watermelon to the green_envelope, and Carter moved the watermelon to the green_basket before exiting. Avery dislikes the tomato, but there is no mention of Avery's thoughts on the watermelon's location. + +Next, Avery, Sophia, Carter, Emily, and Isla entered the waiting_room. Carter likes the green_treasure_chest, but again, there is no mention of Avery's thoughts on the watermelon's location. + +Then, Emily, Isla, and Avery entered the sunroom. The carrot is in the blue_treasure_chest. Emily moved the carrot to the green_box, and Isla moved the carrot to the green_crate before exiting. Avery made no movements and stayed in the sunroom for 1 minute before exiting. Again, there is no mention of Avery's thoughts on the watermelon's location. + +Based on the given information, we cannot determine where Avery thinks Carter thinks the watermelon is. Therefore, the answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..667216f5f9f3e25b33652eacbb96f4d65c0e2adc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Isla think Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. We need to find out where Isla thinks Avery thinks Carter thinks the watermelon is. This means we need to trace the path of the watermelon and see where each agent thinks it is. + +2. According to step 2, the watermelon is in the blue_suitcase. + +3. Avery made no movements and stayed in the workshop for 1 minute, so we can assume that Avery doesn't know that the watermelon has been moved. + +4. Sophia moved the watermelon to the green_envelope, so she knows that it's there. + +5. Carter moved the watermelon to the green_basket, so he knows that it's there. + +6. Isla made no movements and stayed in the workshop for 1 minute, so she doesn't know where the watermelon is. + +7. Now we need to figure out what each agent thinks about the watermelon's location. According to assumption 2, Isla can only infer Avery's thoughts if they have been in the same place or have had private or public interactions. + +8. Avery dislikes the tomato, but we don't know what he thinks about the watermelon's location. + +9. Carter likes the green_treasure_chest, but we don't know what he thinks about the watermelon's location. + +10. Emily moved the carrot to the green_box, so she knows where the carrot is but we don't know what she thinks about the watermelon's location. + +11. Isla moved the carrot to the green_crate, so she knows where the carrot is but we don't know what she thinks about the watermelon's location. + +12. Based on assumption 4, Isla would trust Avery's opinion more than Carter's since Avery exited the sunroom after Carter. + +13. 
Therefore, Isla would think that Avery thinks the watermelon is in the green_basket, since that's where Carter moved it and Avery would have seen it there if he had exited the workshop after Carter. + +14. The answer is D. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec9f8f0b0e55079b33c79bf688942fa50be7e222 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? 
+Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? + +2. We know that the watermelon was initially in the blue_suitcase, but was moved by Sophia to the green_envelope and then by Carter to the green_basket. + +3. Avery made no movements in the workshop, so we don't know where she thinks the watermelon is. + +4. Isla also made no movements in the workshop, so we don't know where she thinks the watermelon is either. + +5. Sophia moved the watermelon to the green_envelope, so we know that she thinks the watermelon is in the green_envelope. + +6. Carter moved the watermelon to the green_basket, so we know that he thinks the watermelon is in the green_basket. + +7. Based on assumption (4), Isla would trust Avery's opinion more than Sophia's or Carter's, since Avery exited the workshop after Isla did. + +8. 
However, we don't know where Avery thinks the watermelon is, since she made no movements in the workshop. + +9. Therefore, we cannot determine where Isla thinks Avery thinks Carter thinks the watermelon is. + +10. The correct answer is: Cannot be determined. + +It's important to carefully analyze the story and assumptions, and to eliminate any options that are not supported by the information given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e182833c1ad173a25b6bee1bcb047fb9135fb64 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. 
+23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where is the lemon really? +Answer: green_bottle +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to trace the movements of the lemon and the agents. According to the story, the lemon was initially in the red_box (statement 2). Then, Evelyn moved the lemon to the red_container (statement 3). After that, Alexander moved the lemon to the green_treasure_chest (statement 7). Finally, Emma moved the pear to the blue_treasure_chest (statement 18). Therefore, the lemon is in the green_treasure_chest (option M). The correct answer is M. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..970aba0723292161672dad60ac246e1d5c7ba422 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Isla really think the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to trace Isla's movements and the movements of the lemon. Isla entered the hall with Evelyn, Alexander, Emma, and Sophia. The lemon was initially in the red_box. Evelyn moved the lemon to the red_container before exiting the hall. Isla made no movements and stayed in the hall for 1 minute before exiting. Alexander then moved the lemon to the green_treasure_chest before exiting the hall. Emma then moved the lemon to the green_bottle before exiting the hall. Sophia made no movements and stayed in the hall for 1 minute before exiting. Isla did not move the lemon, so it should still be in the last place it was moved to, which is the green_bottle. Therefore, the answer is K. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a80073aa65aa542fe4df7cf3b8d26a2ae91324a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. 
+13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Sophia think Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of the lemon and the agents' exits from the hall and TV room. + +According to the story, Evelyn moved the lemon to the red_container in the hall, then left. Isla made no movements in the hall before leaving. Alexander moved the lemon to the green_treasure_chest in the hall, then left. Emma moved the lemon to the green_bottle in the hall, then left. Sophia made no movements in the hall before leaving. 
+ +Next, Alexander, Emma, and Evelyn entered the TV room. The pear is in the red_basket. Alexander made no movements in the TV room before leaving. Emma moved the pear to the blue_treasure_chest in the TV room, then left. Evelyn made no movements in the TV room before leaving. + +Finally, Alexander, Emma, and Evelyn entered the waiting room. + +Based on this information, we know that Isla did not move the lemon in the hall. Therefore, Sophia cannot think that Isla thinks the lemon is in the red_container, as that was Evelyn's action. + +Sophia also did not move the lemon in the hall, so she cannot know its current location based on her own actions. + +However, Sophia knows that Alexander moved the lemon to the green_treasure_chest in the hall, and Emma moved it to the green_bottle in the hall. Therefore, Sophia could think that Isla thinks the lemon is in the green_crate (option C) or the green_bottle (option K), as those are the last two locations the lemon was seen in before the agents left the hall. + +Therefore, the answer is either C or K, depending on Sophia's thought process. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cad167862aa91b3dae97e59388352b8f70e0b24a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. 
+8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Evelyn think Sophia thinks Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions. + +- Evelyn moved the lemon to the red_container before exiting the hall. +- Isla made no movements and stayed in the hall for 1 minute before exiting. 
+- Alexander moved the lemon to the green_treasure_chest before exiting the hall. +- Emma moved the lemon to the green_bottle before exiting the hall. +- Sophia made no movements and stayed in the hall for 1 minute before exiting. + +Then, all five agents entered the waiting_room and later, Alexander, Emma, and Evelyn entered the TV_room. + +- The pear is in the red_basket. +- Alexander made no movements and stayed in the TV_room for 1 minute before exiting. +- Emma moved the pear to the blue_treasure_chest before exiting the TV_room. +- Emma dislikes the eggplant. +- Evelyn made no movements and stayed in the TV_room for 1 minute before exiting. + +Finally, all three agents entered the waiting_room again. + +Based on these movements and assumptions, we can infer that Evelyn only interacted with Isla and Sophia in the hall before they all exited. Therefore, she cannot infer what Isla thinks about the lemon's location since Isla made no movements and they had no interactions. + +Sophia also made no movements and stayed in the hall for 1 minute before exiting. Therefore, she cannot have any information about the lemon's location other than its initial placement in the red_box. + +Therefore, Evelyn cannot infer what Sophia thinks about the lemon's location. The answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c95d4c71eb14b147c298d30d2e1a25bd82771308 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. 
+3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? + +We need to trace the thought process of each agent to determine where they think the lemon is. Starting with Isla, we know that she made no movements and stayed in the hall for 1 minute, so she did not interact with the lemon. Sophia also made no movements and stayed in the hall for 1 minute, so she did not interact with the lemon either. This means that Isla and Sophia have no information about the lemon's location. + +Moving on to Evelyn, we know that she moved the lemon to the red_container before exiting the hall. Therefore, she knows that the lemon is in the red_container. However, we don't know what she thinks about where Isla or Sophia think the lemon is. + +Finally, we come to Alexander. We know that he moved the lemon to the green_treasure_chest before exiting the hall. Therefore, he knows that the lemon is in the green_treasure_chest. But what does he think about where Evelyn, Sophia, and Isla think the lemon is? + +2. An agent tends to trust an agent that exited the room later than himself. + +We know that Alexander exited the hall after Evelyn, so he tends to trust her more than Sophia or Isla. Therefore, he is more likely to believe that Evelyn knows where the lemon is than the other two. + +3. An agent can infer another agent's thought only if they have been in the same place or have private or public interactions. + +We know that Alexander, Evelyn, and Sophia were all in the TV_room together, so they could have had private or public interactions. However, Isla was not present, so Alexander cannot infer her thoughts about the lemon's location. + +4. Every agent tends to lie. + +This means that we cannot trust what any of the agents say about where they think the lemon is. 
We have to rely on their actions and the assumptions above to determine where they actually think the lemon is. + +Putting all of this together, we can conclude that Alexander thinks Evelyn thinks the lemon is in the red_container (where she actually moved it to), but he cannot infer what Sophia or Isla think about the lemon's location. Therefore, the answer is O. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce2a44b918c1de5583ec3d254c3fd4d89feedf36 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. 
+23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where is the corn really? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the corn and which agents were involved. According to the story, the corn was initially in the red_basket (step 2), then moved to the green_bathtub by Hannah (step 3), then moved back to the red_basket by Avery (step 13). Finally, Abigail moved the corn to the green_bucket (step 21). Therefore, the corn is really in the green_bucket. The answer is E. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb32b83ca35a1046c8337af61c03e30679818a9c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Abigail really think the corn is? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. 
green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the corn and the agents. According to the story, the corn was initially in the red_basket (step 2), then Hannah moved it to the green_bathtub (step 3), and Avery moved it back to the red_basket (step 13). Later, Abigail entered the basement with Hannah and William (step 17), and moved the corn to the green_bucket (step 21). Abigail then exited the basement (step 22), followed by William (step 24) and Hannah (step 25). + +Based on the assumption that agents tend to lie, we cannot trust what Abigail says about the location of the corn. However, we can infer her actual thought based on her movements and interactions with other agents. Since Abigail was in the basement with Hannah and William when the corn was moved to the green_bucket, and she exited the basement before them, she would tend to trust their claim that the corn was in the green_bucket. Therefore, the answer is E. green_bucket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..94f2a6bc5f9a8d9de637d9ae3d3c5b8bd4e60b1d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Nathan think Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. 
green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of Nathan and Abigail in relation to the corn. We know that the corn was initially in the red_basket, then moved to the green_bathtub by Hannah, and then moved back to the red_basket by Avery. Later, Abigail entered the basement and made a movement with the corn, moving it to the green_bucket. Nathan also entered the basement but made no movements with the corn before exiting. + +Based on the assumptions given, we know that Nathan can only infer Abigail's thoughts if they had private or public interactions. We also know that agents tend to lie, so we cannot trust what they say to each other. + +Therefore, we cannot determine where Nathan thinks Abigail thinks the corn is with certainty. It could be in the green_bucket, as that is where Abigail moved it to, but Nathan may not have had any interactions with Abigail to know this. It could also be in the red_basket, as that is where the corn was when Nathan first entered the basement. + +The correct answer is either A. red_basket or E. green_bucket, but we cannot determine which one with certainty based on the given information. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c28e0880d65d7074f721bbcc42c400f28acd3a0f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Avery think Nathan thinks Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. 
blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of Avery, Nathan, and Abigail in relation to the corn. From the story, we know that the corn starts in the red_basket, is moved to the green_bathtub by Hannah, then moved back to the red_basket by Avery. Abigail later moves the corn to the green_bucket. + +We also know that Nathan loses his watch in the waiting_room and that Hannah, Abigail, and William enter the basement after this happens. However, we don't have any information about where Nathan thinks the corn is. + +Since Avery is the only one who moves the corn after Nathan loses his watch, we can assume that Nathan doesn't know that the corn has been moved to the green_bucket by Abigail. Therefore, Avery must think that Nathan thinks the corn is still in the red_basket. + +However, the question is asking where Avery thinks Nathan thinks Abigail thinks the corn is. We don't have any information about private or public interactions between Avery and Nathan, so we can't be sure what Avery thinks Nathan thinks. Therefore, the answer to the question is A. red_basket, since that is the only location we can be sure Nathan knows the corn is in. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..696c57fc69a6a08e736f8d865ddde92d18ca8ab3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Hannah think Avery thinks Nathan thinks Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. 
blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to trace the movements and thoughts of each agent. + +1. Hannah moved the corn from the red_basket to the green_bathtub and dislikes the corn. +2. Avery likes the green_crate. +3. William made no movements in the basement. +4. Abigail moved the corn from the green_bathtub to the green_bucket. +5. Nathan made no movements in the basement and lost his watch in the waiting_room. + +Since Avery never interacted with the corn, we can eliminate any options that involve Avery's direct thoughts about the corn. + +Next, we need to determine where Nathan thinks the corn is. Since Nathan made no movements in the basement, he would not know that Abigail moved the corn to the green_bucket. Therefore, Nathan would still think the corn is in the red_basket. + +Abigail moved the corn to the green_bucket, but we need to determine where she thinks the corn is. Since Hannah was the last person to exit the basement before Abigail, Abigail would trust Hannah's claim about the location of the corn. Therefore, Abigail would also think the corn is in the green_bucket. + +Finally, we need to determine where Hannah thinks Abigail thinks the corn is. 
Since Hannah moved the corn to the green_bathtub and dislikes the corn, she would not trust Abigail's claim about the location of the corn. Therefore, Hannah would still think the corn is in the red_basket. + +Based on this analysis, the answer is A. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6910b70eb3d8c71f6461168bfcc6b340a869d2ba --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where is the tangerine really? +Answer: green_bottle +Choices: A. 
red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the tangerine and the agents. Here are the steps to solve the question: + +1. Liam moved the tangerine from the green_bottle to the blue_treasure_chest. +2. Jackson moved the tangerine from the blue_treasure_chest to the green_bathtub. +3. Benjamin moved the tangerine from the green_bathtub to the red_bucket. +4. Sophia moved the tangerine from the red_bucket to the green_bottle. + +Therefore, the tangerine is really in the green_bottle. The answer is L. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..dbc5ef62df84e041f00e1fe5f17b4d9837d8a323 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Benjamin really think the tangerine is? +Answer: red_bucket +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the tangerine and the agents' thoughts. Here are the steps to solve the question: + +1. Liam moved the tangerine to the blue_treasure_chest. +2. Jackson moved the tangerine to the green_bathtub. +3. Benjamin moved the tangerine to the red_bucket. +4. Sophia moved the tangerine to the green_bottle. +5. Liam exited the den. +6. Jackson exited the den. +7. Carter made no movements and stayed in the den for 1 minute. +8. Benjamin exited the den. +9. Benjamin moved the plum to the green_crate. +10. Liam moved the plum to the red_drawer. +11. Jackson dislikes the tangerine. +12. Carter made no movements and stayed in the bathroom for 1 minute. +13. Benjamin lost his phone. +14. Carter exited the bathroom. +15. Benjamin, Liam and Carter entered the waiting_room. + +Based on the assumptions, we know that Benjamin can only infer the thoughts of Liam, Jackson, and Sophia since he was in the same room as them when they moved the tangerine. We also know that agents tend to lie, so we cannot trust what they say to each other. + +From the story, we know that Benjamin moved the tangerine to the red_bucket, but we don't know if he thinks it's still there. We also know that Liam moved the plum to the red_drawer, but we don't know if Benjamin knows this. + +Therefore, we cannot determine where Benjamin really thinks the tangerine is based on the given information. The answer is inconclusive. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e4d02814568dbdf17f9581d58cc527cc464758d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Liam think Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track the movements of the tangerine and the agents' exits from the den and the bathroom. Liam moved the tangerine to the blue_treasure_chest and then exited the den. Jackson moved the tangerine to the green_bathtub and then exited the den. Carter made no movements and stayed in the den for 1 minute before exiting. Benjamin moved the tangerine to the red_bucket and then exited the den. Sophia moved the tangerine back to the green_bottle before exiting the den. Benjamin, Liam, and Carter then entered the bathroom, where Benjamin moved the plum to the green_crate and Liam moved it to the red_drawer before they all exited. Based on the assumption that agents tend to trust those who exited the room later than themselves, Liam would trust Benjamin's movements more than Jackson's or Sophia's. Therefore, Liam would think that Benjamin thinks the tangerine is in the red_bucket, as that was the last place Benjamin moved it before exiting the den. The answer is K. red_bucket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b2beb22cb824957eef125cec1c380b3ba783877 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Carter think Liam thinks Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of the tangerine and the thoughts of the agents. According to the story, Liam moved the tangerine to the blue_treasure_chest, then Jackson moved it to the green_bathtub, Benjamin moved it to the red_bucket, and finally Sophia moved it back to the green_bottle. Carter made no movements related to the tangerine. + +We also know that Sophia dislikes the banana, and Jackson dislikes the tangerine. However, we don't have any information about the thoughts of Liam, Benjamin, or Carter regarding the tangerine. + +Since Carter made no movements related to the tangerine, we can assume that he doesn't have a strong opinion about its location. However, he may have overheard conversations or seen movements of other agents that could give him a clue about their thoughts. + +Based on the assumption that an agent tends to trust another agent who exited the room later than himself, we can assume that Carter trusts Benjamin more than Liam. This is because Benjamin exited the bathroom after Liam, and they both entered the waiting room together with Carter. + +Therefore, we need to determine where Benjamin thinks the tangerine is, and then assume that Carter thinks Liam thinks the same thing. 
According to the story, Benjamin moved the plum from the blue_suitcase to the green_crate, and then Liam moved it to the red_drawer. There is no information about Benjamin's thoughts regarding the tangerine. + +Since we don't have any information about Benjamin's thoughts regarding the tangerine, we cannot determine where he thinks it is. Therefore, we cannot determine where Carter thinks Liam thinks Benjamin thinks the tangerine is. The answer is not given in the options provided. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1de4635aad3722ffb306e02c9da40e788c3f345a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. 
+22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Jackson think Carter thinks Liam thinks Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of the tangerine and the thoughts of each character. + +- Liam moved the tangerine to the blue_treasure_chest. +- Jackson moved the tangerine to the green_bathtub and dislikes the tangerine. +- Carter made no movements and stayed in the den for 1 minute, then exited. +- Benjamin moved the tangerine to the red_bucket. +- Sophia moved the tangerine to the green_bottle and dislikes the banana. +- Liam exited the den. +- Benjamin moved the plum to the green_crate. +- Liam moved the plum to the red_drawer. +- Jackson dislikes the tangerine. +- Carter made no movements and stayed in the bathroom for 1 minute, then exited. +- Benjamin lost his phone. 
+ +Based on the assumptions, we know that Jackson can only infer Carter's thoughts if they have been in the same place or had private/public interactions. We also know that agents tend to lie, so what they tell others doesn't necessarily reflect their actual thoughts. + +Since Jackson dislikes the tangerine, we can eliminate any options where the tangerine is located. We also know that Carter made no movements with the tangerine, so his thoughts about its location are unknown. + +Liam moved the plum to the red_drawer, so we can eliminate any options where the plum is located. + +Benjamin lost his phone, so we can eliminate any options where the plum or tangerine are located since he would have been preoccupied with finding his phone instead of moving fruit. + +Therefore, the only option left is where the tangerine was last moved by Sophia, which is the green_bottle. + +So, Jackson thinks Carter thinks Liam thinks Benjamin thinks the tangerine is in the green_bottle. The answer is L. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4bf09dc65c90280e6ddbdff933feaead50fdcc55 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. 
+10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where is the lime really? +Answer: green_pantry +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the lime and which agent moved it. According to the story, the lime was initially in the red_bottle, but Lily moved it to the blue_drawer. Then, Evelyn moved it to the green_pantry. 
Therefore, the lime is really in the green_pantry. The answer is B. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..897b6885e19b6e15e87cc17b87991606ee6fd6ed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Owen really think the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. 
red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: To solve this question, we need to track Owen's movements and any interactions he had with other agents regarding the lime. According to the story, Owen made no movements in the front yard and exited after one minute. Therefore, he did not interact with any other agents regarding the lime in the front yard. In the waiting room, Owen entered with Lily, Emily, Ella, and Evelyn, but there is no mention of any interactions regarding the lime. However, we know that Owen likes the blue drawer, which is where Lily moved the lime to. Therefore, based on the given assumptions, we can infer that Owen trusts Lily's claim and thinks that the lime is in the blue drawer. Therefore, the answer is C. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9892d603500af8ebf9da9527d38496bcecef79ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Emily think Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with each other. + +- Lily moved the lime from the red_bottle to the blue_drawer before exiting the front_yard. +- Ella liked the red_bottle but made no movements before exiting the front_yard. +- Owen made no movements before exiting the front_yard. +- Evelyn moved the lime to the green_pantry before exiting the front_yard. +- Emily made no movements before exiting the front_yard. + +Therefore, Emily did not witness the movement of the lime and does not know where it is. However, we can use the assumption that agents tend to trust those who exited the room later than themselves. + +Owen exited the front_yard after Emily, so she may trust his thoughts on the location of the lime. According to the story, Owen likes the blue_drawer, but Lily moved the lime from the red_bottle to the blue_drawer before exiting the front_yard. Therefore, Owen may think that the lime is in the blue_drawer. + +The answer is C. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a38422e67e41d56499c4b271a901bcec5652f3a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. 
+6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Lily think Emily thinks Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to trace Lily's movements and interactions with the other agents. Lily initially moved the lime from the red_bottle to the blue_drawer. After Lily exited the front_yard, Ella and Owen stayed in the front_yard for a minute each without making any movements. Then, Evelyn moved the lime to the green_pantry before exiting the front_yard. Finally, Emily stayed in the front_yard for a minute before exiting. + +Lily was not present when the lime was moved to the green_pantry, so she does not know that it is there. However, she knows that the lime is not in the red_bottle or the blue_drawer anymore. Since Owen likes the blue_drawer and Lily moved the lime from there, it is unlikely that Owen thinks the lime is in the blue_drawer. Additionally, Lily knows that Emily was in the front_yard after she left and before Emily left, so she may have overheard or had a private conversation with Emily about the lime's location. + +Based on these clues, Lily may think that Emily thinks Owen thinks the lime is in the red_bottle. This is because Ella liked the red_bottle and may have mentioned it to Emily, who then told Lily. However, since the agents tend to lie, this is not a definite answer. + +Therefore, the answer is A. red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a106d61af98df360cc032c9a1a0459de6e36ff0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. 
+4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_drawer +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Emily think the lime is? +- We know that Lily moved the lime from the red_bottle to the blue_drawer, so Emily should think the lime is in the blue_drawer. + +2. Where does Lily think Emily thinks the lime is? +- Lily was in the attic with Emily, but she didn't make any movements or statements about the lime. Therefore, we can't infer what Lily thinks Emily thinks about the lime. + +3. Where does Owen think the lime is? +- Owen was in the front_yard and didn't make any movements or statements about the lime. Therefore, we can't infer what Owen thinks about the lime. + +4. Where does Emily think Owen thinks the lime is? +- Emily didn't have any interactions with Owen, so we can't infer what she thinks he thinks about the lime. + +5. Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +- Ella was in the front_yard with Lily, but Lily didn't make any movements or statements about the lime while they were there. However, Lily did move the lime to the blue_drawer before leaving the front_yard. Therefore, Ella should think that Lily thinks Emily thinks Owen thinks the lime is in the blue_drawer. + +Answer: C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..666b866c145a2f2ec68c71bf25570c3b509a90f3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. 
+3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where is the corn really? +Answer: blue_container +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: To solve this question, we need to track the movements and statements of the agents related to the corn. According to the story, Sophia moved the corn to the blue_container, and Lily later moved the tomato to the green_drawer. Therefore, the corn is in the blue_container, which is option M. The correct answer is M. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..15f99a51fbe3ff602a7920695579877d0578f8db --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. 
+23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Noah really think the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to look for any information related to where Noah thinks the corn is. According to the story, we know that the corn is in the blue_treasure_chest, and Sophia moved it to the blue_container. However, there is no information about Noah's thoughts on the corn's location, except for the fact that he dislikes green pepper. Therefore, we cannot determine where Noah really thinks the corn is based on the given information. The answer is not provided in the options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88e4b9945c9752931e418766704d0f684d7736d9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Lily think Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. 
blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track Lily and Noah's movements and thoughts regarding the corn. According to the story, Lily made no movements in the staircase and stayed there for 1 minute. Noah dislikes the green pepper but there is no mention of his thoughts on the corn. However, we know that Sophia moved the corn to the blue container. Lily then entered the front yard with Isla and Sophia, and moved the tomato to the green drawer. Finally, Lily and the others entered the waiting room. + +Based on Lily's movements and the assumption that she tends to lie, we cannot trust her claims about where she thinks Noah thinks the corn is. However, we can infer that Noah might think the corn is in the blue container since that is where Sophia moved it. Therefore, the answer is M. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..139f539a20b8eed059a07e0e720a2ddeb50f05f3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Isla think Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Isla think Lily thinks Noah thinks the corn is? + +2. Isla and Lily were both in the front yard where the tomato is located, but there is no mention of them discussing the corn or Noah's thoughts. + +3. Noah dislikes the green pepper, but there is no mention of him having any thoughts about the corn. + +4. Sophia moved the corn to the blue container, but there is no mention of her discussing it with anyone else. + +5. Lily moved the tomato to the green drawer, but there is no mention of her discussing the corn or Noah's thoughts. + +6. Isla made no movements in the staircase or waiting room, so there is no information about her thoughts on the corn or Noah's thoughts. + +7. Based on the story and assumptions, we can infer that Isla and Lily did not have any private or public interactions where they discussed the corn or Noah's thoughts. + +8. Therefore, we cannot determine where Isla thinks Lily thinks Noah thinks the corn is. + +9. The answer is none of the above (N/A). + +In summary, this question requires careful analysis of the story and assumptions, and the answer cannot be determined based on the given information. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2f649dce8679709bb34d6575ccd96ac592da077 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1,85 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Mila think Isla thinks Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. 
blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Mila entered the staircase with Isla, Noah, Sophia, and Lily. +2. The corn is in the blue_treasure_chest. +3. Mila made no movements and stayed in the staircase for 1 minute. +4. Mila exited the staircase. +5. Isla made no movements and stayed in the staircase for 1 minute. +6. Noah dislikes the green_pepper. +7. Isla exited the staircase. +8. Noah made no movements and stayed in the staircase for 1 minute. +9. Noah exited the staircase. +10. Sophia moved the corn to the blue_container. +11. Sophia exited the staircase. +12. Lily made no movements and stayed in the staircase for 1 minute. +13. Sophia dislikes the tomato. +14. Lily exited the staircase. +15. Mila, Isla, Noah, Sophia, and Lily entered the waiting_room. +16. Isla, Sophia, and Lily entered the front_yard. +17. The tomato is in the red_box. +18. Isla made no movements and stayed in the front_yard for 1 minute. +19. Isla exited the front_yard. +20. Sophia made no movements and stayed in the front_yard for 1 minute. +21. Sophia exited the front_yard. +22. Lily moved the tomato to the green_drawer. +23. Lily exited the front_yard. +24. 
Isla, Sophia, and Lily entered the waiting_room. + +Based on the story and assumptions, we can infer the following: + +- Mila knows that the corn is in the blue_treasure_chest. +- Mila knows that Sophia moved the corn to the blue_container. +- Mila knows that Sophia dislikes the tomato. +- Mila knows that the tomato is in the red_box. +- Mila knows that Lily moved the tomato to the green_drawer. +- Mila knows that Isla stayed in the front_yard for 1 minute and then left. +- Mila does not know what Noah thinks about the corn. + +Now let's break down the question: + +- Mila thinks Isla thinks Lily thinks Noah thinks the corn is in a certain location. +- We need to determine which location Mila thinks Isla thinks Lily thinks Noah thinks the corn is in. + +To solve this question, we need to work backwards from Mila to Noah to Lily to Isla. Here's the reasoning: + +- Mila does not know what Noah thinks about the corn, so she cannot base her answer on his thoughts. +- Lily moved the tomato to the green_drawer, so Mila knows that Lily does not think the corn is in the green_drawer. +- Isla stayed in the front_yard for 1 minute and then left, so Mila does not know what Isla thinks about the corn. +- Therefore, Mila must base her answer on what she thinks Lily thinks about the corn. +- Sophia dislikes the tomato, so Mila knows that Sophia does not think the corn is in the red_box. +- Sophia moved the corn to the blue_container, so Mila knows that Sophia does not think the corn is in the blue_treasure_chest. +- Therefore, Mila must think that Lily thinks Noah thinks the corn is in the blue_treasure_chest. + +Based on this reasoning, the answer is (E) blue_suitcase. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..48dc5349f60686781ca53dab84371c653e544259 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. 
blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the tomato and the agents. According to the story, Sophia moved the tomato to the blue_cupboard, then Jackson moved it to the blue_crate, and finally Nathan moved it back to the blue_container. Therefore, the tomato is in the blue_container. The answer is K. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..34dbd0fb4fcad6760ce53c380dd5515a76978c36 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. 
+10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Jackson really think the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track Jackson's movements and any interactions he had with other agents. According to the story, Jackson moved the tomato to the blue_crate and then exited the laundry. He later entered the hall with Nathan and Amelia, where he moved the onion to the red_envelope and saw a mouse. 
Amelia then exited the hall, and Jackson lost his phone. Finally, Jackson, Nathan, and Amelia entered the waiting_room. + +Based on these movements and interactions, we can infer that Jackson did not have any private or public interactions with Sophia, who moved the tomato to the blue_cupboard before exiting the laundry. Therefore, he would not know that the tomato was moved to the blue_cupboard. Additionally, he did not have any interactions with Charlotte, who made no movements in the laundry, or with Nathan, who moved the tomato to the blue_container after Jackson had already left the laundry. + +Therefore, the only place where Jackson could have seen the tomato is in the blue_crate, where he moved it before leaving the laundry. Therefore, Jackson really thinks the tomato is in the L. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ebeea452dbe19b5ca7266eae99df85280fce85a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1,66 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. 
+14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Nathan think Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: The question is asking about Nathan's thoughts regarding Jackson's thoughts on the location of the tomato. To answer this question, we need to track the movements of the tomato and the agents. + +1. Sophia, Jackson, Amelia, Charlotte, and Nathan entered the laundry. +2. The tomato is in the blue_container. +3. Sophia moved the tomato to the blue_cupboard. +4. Sophia exited the laundry. +5. Jackson moved the tomato to the blue_crate. +6. Jackson exited the laundry. +7. Amelia made no movements and stayed in the laundry for 1 minute. +8. 
Amelia exited the laundry. +9. Charlotte made no movements and stayed in the laundry for 1 minute. +10. Charlotte exited the laundry. +11. Nathan moved the tomato to the blue_container. +12. Nathan exited the laundry. +13. Sophia, Jackson, Amelia, Charlotte, and Nathan entered the waiting_room. +14. Nathan, Jackson, and Amelia entered the hall. +15. The onion is in the blue_treasure_chest. +16. Nathan made no movements and stayed in the hall for 1 minute. +17. Nathan exited the hall. +18. Jackson moved the onion to the red_envelope. +19. Jackson exited the hall. +20. Amelia moved the onion to the green_cupboard. +21. Jackson saw a mouse. +22. Amelia exited the hall. +23. Jackson lost his phone. +24. Nathan, Jackson, and Amelia entered the waiting_room. + +Based on the story, Nathan moved the tomato to the blue_container after Jackson moved it to the blue_crate. Therefore, Nathan knows that the tomato is not in the blue_crate. + +We don't have any information about private or public interactions between Nathan and Jackson, so we can't assume that Nathan knows Jackson's thoughts on the location of the tomato. However, we do know that Nathan exited the hall after Jackson, so he may be more likely to trust Jackson's thoughts on the location of the tomato. + +From the story, we know that the tomato was last seen in the blue_crate before Jackson exited the laundry. Therefore, Nathan may think that Jackson thinks the tomato is still in the blue_crate. + +The answer is L. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9bced24226f9b81e0d9a1c83dd842cb3b0f8dcb0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1,73 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Amelia think Nathan thinks Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Amelia think Nathan thinks Jackson thinks the tomato is? + +2. We need to determine the location of the tomato according to each agent's movements and statements. + +3. Sophia moved the tomato to the blue_cupboard, and Jackson moved it to the blue_crate. + +4. Nathan moved the tomato back to the blue_container. + +5. Therefore, Nathan must have known that the tomato was originally in the blue_cupboard, and Jackson moved it to the blue_crate. + +6. Amelia made no movements in the laundry, so she does not have any direct knowledge of the tomato's location. + +7. Charlotte also made no movements in the laundry, so she does not have any direct knowledge of the tomato's location. + +8. Nathan, Jackson, and Amelia entered the hall, where the onion is located in the blue_treasure_chest. + +9. Nathan made no movements in the hall, so he does not have any direct knowledge of the onion's location. + +10. Jackson moved the onion to the red_envelope. + +11. Amelia moved the onion to the green_cupboard. + +12. Jackson saw a mouse and lost his phone, but these events are not relevant to the question. + +13. Nathan, Jackson, and Amelia then entered the waiting_room. + +14. Based on the movements and statements of the agents, we can conclude that Nathan knows the tomato was originally in the blue_cupboard, and Jackson moved it to the blue_crate. + +15. Amelia does not have any direct knowledge of the tomato's location, but she knows that Nathan knows it was in the blue_cupboard and Jackson moved it to the blue_crate. + +16. We need to determine where Amelia thinks Nathan thinks Jackson thinks the tomato is. + +17. 
Since Nathan knows the tomato was originally in the blue_cupboard and Jackson moved it to the blue_crate, he must think the tomato is in the blue_crate. + +18. Amelia knows that Nathan knows the tomato was originally in the blue_cupboard and Jackson moved it to the blue_crate, so she must think that Nathan thinks Jackson thinks the tomato is in the blue_crate. + +19. Therefore, the answer is L. blue_crate. + +So, the answer is L. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b10038fc8951ce80731ec6bc1ba1f5f0ec5cec1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. 
+22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +Answer: blue_cupboard +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Nathan think the tomato is? +- We know that Nathan moved the tomato to the blue_container before leaving the laundry. Therefore, Nathan thinks the tomato is in the blue_container. + +2. Where does Jackson think the tomato is? +- We know that Jackson moved the tomato to the blue_crate after Sophia left the laundry. Therefore, Jackson thinks the tomato is in the blue_crate. + +3. Where does Nathan think Jackson thinks the tomato is? +- We don't have enough information to answer this question. Nathan left the laundry before Jackson moved the tomato to the blue_crate, so he doesn't know where Jackson put it. We can only assume that Nathan thinks Jackson still believes the tomato is in the blue_container. + +4. 
Where does Amelia think Nathan thinks Jackson thinks the tomato is? +- We don't have any information about Amelia's thoughts on the tomato's location. However, we know that Amelia moved the onion to the green_cupboard in the hall. This means that she was in the same room as Jackson when he saw the mouse and lost his phone. Therefore, she may have overheard or witnessed something that could give her insight into Jackson's thoughts. + +5. Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +- Sophia moved the tomato from the blue_container to the blue_cupboard before leaving the laundry. Therefore, she thinks the tomato is in the blue_cupboard. However, we don't have any information about her thoughts on Amelia's or Nathan's beliefs about the tomato's location. + +Based on the information given, we can't determine where Sophia thinks Amelia thinks Nathan thinks Jackson thinks the tomato is. The answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..eee1419b42723612e6b4f966ab2ad5e6bcca242c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. 
+10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where is the corn really? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to follow the movements of the agents and the location of the corn. According to the story, the corn was initially in the red_basket (step 2). Liam moved the corn to the red_container (step 3) before exiting the hallway (step 4). Sophia and Lily made no movements and stayed in the hallway for 1 minute each (steps 5 and 7), while Carter made no movements and stayed in the hallway for 1 minute (step 9). 
Amelia moved the corn back to the red_basket (step 11) before exiting the hallway (step 12). Therefore, the corn is in the red_basket, which is option B. + +The correct answer is B. red_basket. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5909782b89e95dcda541f5a7dea2ee7ab7b2dc4b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Amelia really think the corn is? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. 
green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to trace Amelia's movements and actions related to the corn. According to the story, Amelia moved the corn to the red_basket before exiting the hallway. Therefore, Amelia really thinks that the corn is in the red_basket. The answer is B. red_basket. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c36d5a311eb09b4c6e6f8328d0da1399daa75a77 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. 
+9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Lily think Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of Amelia and the corn. According to the story, Amelia moved the corn to the red_basket before exiting the hallway. Lily entered the hallway after Amelia had left, so she did not witness Amelia moving the corn. However, Lily did witness Liam moving the melon to the red_basket before he exited the hallway. 
Therefore, Lily may assume that Amelia also put the corn in the red_basket since Liam put the melon there. + +The answer is B. red_basket. + +a: 1 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a4b3c044702dd2e45b795111406d2aa08706d58b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Sophia think Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. 
red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Sophia think Lily thinks Amelia thinks the corn is? + +2. We know that Sophia and Lily were both in the hallway at different times, but we don't know if they had any private or public interactions. Therefore, Sophia cannot infer Lily's thoughts about the corn. + +3. Lily was in the hallway with Liam and Carter when they moved the melon. She then exited the hallway and we don't know where she went. Therefore, Lily cannot have any knowledge of where Amelia thinks the corn is. + +4. Amelia moved the corn to the red_basket before entering the waiting_room with Liam, Sophia, Lily, and Carter. Therefore, Amelia thinks the corn is in the red_basket. + +5. Since Sophia cannot infer Lily's thoughts and Lily cannot have any knowledge of where Amelia thinks the corn is, we cannot determine where Sophia thinks Lily thinks Amelia thinks the corn is. + +Therefore, the answer is none of the above. 
+ +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec15ad3a75135e13f5075c290d4ae1d760042e82 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Liam think Sophia thinks Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Liam moved the corn to the red_container, so he knows the corn is in the red_container. +2. Sophia made no movements and stayed in the hallway for 1 minute, so she doesn't know where the corn is. +3. Lily made no movements and stayed in the hallway for 1 minute, so she doesn't know where the corn is. +4. Carter made no movements and stayed in the hallway for 1 minute, so he doesn't know where the corn is. +5. Amelia moved the corn to the red_basket, but Liam, Sophia, Lily, and Carter were not present when she did this, so they don't know where the corn is now. +6. Liam, Lily, and Carter entered the hallway again, and Liam moved the melon to the red_basket. So Liam knows that the melon is in the red_basket, but he still doesn't know where the corn is. +7. Lily moved the melon to the green_pantry, but Liam and Carter were not present when she did this, so they don't know where the melon is now. +8. Carter moved the melon to the red_container, so he knows that the melon is in the red_container. +9. Sophia dislikes the corn, but we don't know where she thinks it is. +10. Liam, Lily, and Carter entered the waiting_room, but they didn't discuss the location of the corn or the melon with each other. 
+ +Based on these steps, we can eliminate options A, E, G, I, M, N, and O because there is no evidence that any of the characters know or think that the corn is in any of these locations. We can also eliminate options D, F, H, and K because they are not mentioned in the story at all. + +That leaves us with options B (red_basket) and C (red_container). Liam knows that the corn was originally in the red_basket, but he doesn't know that Amelia moved it to the red_container. Sophia, Lily, and Carter don't know where the corn is, so they could think it's still in the red_basket or they could have no idea. Since Liam exited the hallway before Amelia moved the corn, he would trust her less than he would trust someone who exited the hallway after her. Therefore, he might not believe that the corn is in the red_container, even if he knows that Amelia moved it there. + +So, the answer is B (red_basket). Liam thinks that Sophia thinks that Lily thinks that Amelia thinks the corn is still in the red_basket. + +a: 5 1 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..97b632920df5ee408b9b50b844143cf5f7254a87 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. 
+10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where is the peas really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of the peas and which agent moved it to which location. According to the story, the peas was initially in the blue_suitcase (statement 3). 
Emily moved the peas to the red_basket (statement 4), then Ella moved it to the red_envelope (statement 6), and finally Nathan moved it back to the blue_suitcase (statement 12). Therefore, the correct answer is A. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67f557c2491a64f0bc76a2c6b2d73cbbbcc50d7f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Nathan really think the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. 
red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track Nathan's movements and infer his thoughts based on the given assumptions. Nathan moved the peas to the blue suitcase after everyone else had exited the bathroom. Later, he entered the waiting room with the group and then went to the kitchen with Avery and Evelyn. While in the kitchen, he made no movements and stayed there for a minute before exiting. Based on the assumption that an agent tends to trust another agent who exited the room later than himself, we can assume that Nathan trusts Avery and Evelyn's claims about the location of the peas. + +From the story, we know that Emily moved the peas from the blue suitcase to the red basket, and Ella moved it from the red basket to the red envelope. Avery then moved it to the blue cupboard before Nathan moved it back to the blue suitcase. Therefore, Nathan knows that the peas is not in the blue cupboard or the red basket. + +There is no information about the green envelope, green basket, red crate, blue container, blue bucket, green bottle, blue treasure chest, red bucket, green box, or blue bathtub, so we can eliminate those options. 
The only option left is the red box, which is mentioned in the story as the location of the corn. + +Therefore, Nathan really thinks that the peas is in the red box. The answer is F. red_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cfa139576034f558fc20343ce2c8da452a402a0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. 
green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of the peas and the agents. Emily moved the peas from the blue suitcase to the red basket, then exited the bathroom. Ella moved the peas from the red basket to the red envelope, then exited the bathroom. Avery moved the peas from the red envelope to the blue cupboard, then exited the bathroom. Nathan moved the peas from the blue cupboard to the blue suitcase, then exited the bathroom. + +Since Emily exited the bathroom before Nathan moved the peas to the blue suitcase, she would not know where Nathan moved the peas. However, we can infer where Nathan thinks the peas is based on his movements. Nathan moved the peas from the blue cupboard to the blue suitcase, so he must think the peas is in the blue cupboard before he moved it. + +Therefore, the answer to the question is A. blue_suitcase. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..736c32ac58d62b1a6d4641741e361e88f28d80c0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Ella think Emily thinks Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of the agents and their interactions. First, Emily moved the peas from the blue suitcase to the red basket. Then, Ella moved the peas from the red basket to the red envelope. Avery then moved the peas from the red envelope to the blue cupboard. Nathan moved the peas from the blue cupboard back to the blue suitcase. + +Since Ella moved the peas after Emily, she knows that Emily thinks the peas are in the red basket. However, Nathan moved the peas back to the blue suitcase after Emily moved them to the red basket. Therefore, Ella thinks that Nathan thinks the peas are in the blue suitcase. + +The answer is A. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..81c47a950c713ac6843a0f7c58f4f8694be9f377 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. 
+4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Evelyn think Ella thinks Emily thinks Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_basket +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Nathan move the peas to? According to step 12, Nathan moves the peas to the blue suitcase. +2. Who enters the waiting room with Evelyn, Avery, and Nathan? According to step 14, Emily, Ella, Avery, Evelyn, and Nathan enter the waiting room together. +3. Who enters the kitchen with Evelyn, Avery, and Nathan? According to step 15, Evelyn, Avery, and Nathan enter the kitchen together. +4. Where is the corn located? According to step 16, the corn is in the red box. +5. Who exits the kitchen last? According to assumption 4, agents tend to trust an agent that exited the room later than themselves. Therefore, Nathan exits the kitchen last. +6. Who thinks the peas is in the red basket? According to step 4, Emily moves the peas to the red basket. However, we are not given any information about who thinks the peas is in the red basket. +7. Who thinks the peas is in the blue cupboard? According to step 8, Avery moves the peas to the blue cupboard. However, we are not given any information about who thinks the peas is in the blue cupboard. +8. Who thinks the peas is in the red envelope? According to step 6, Ella moves the peas to the red envelope. However, we are not given any information about who thinks the peas is in the red envelope. +9. Who thinks the peas is in the blue suitcase? According to step 12, Nathan moves the peas to the blue suitcase. However, we are not given any information about who thinks the peas is in the blue suitcase. +10. Who thinks the peas is in the green envelope, green basket, red crate, blue bathtub, blue container, blue bucket, green bottle, blue treasure chest, red bucket, or green box? There is no information in the story or assumptions that suggests any of the characters think the peas is in any of these locations. 
+ +Based on the information we have, we cannot determine where Evelyn thinks Ella thinks Emily thinks Nathan thinks the peas is. The answer is none of the above. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c828d5e4394079f9b62d7e341538fc11d5fadf09 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where is the peas really? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. 
blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of the peas and which agent moved it to which location. According to the story, the peas started in the green_drawer and was moved by Liam to the blue_container. Then, Noah moved the peas to the green_crate and Avery moved it to the blue_bucket. Finally, Mila moved the melon to the blue_suitcase. Therefore, the answer is C. blue_suitcase. + +a: 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4361d00fe827960379617f3f163e142c88a58afc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. 
+9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Benjamin really think the peas is? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track Benjamin's movements and any interactions he had with other agents regarding the location of the peas. According to the story, Benjamin made no movements after entering the workshop and stayed there for 1 minute before exiting. 
Therefore, he did not interact with any of the agents who moved the peas. We also do not have any information about Benjamin's private thoughts or conversations with other agents. Therefore, we cannot determine where Benjamin really thinks the peas is. The answer is unknown. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..90101079196c2deb7bca9ede067d8d15f1171902 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks the peas is? +Answer: green_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. 
green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: Step 1: Identify the agents who have information about the location of the peas and their movements. + +Agents who have information about the location of the peas: Liam, Noah, Avery, Mila + +Agents who have made movements related to the peas: Liam, Noah, Avery, Mila + +Step 2: Identify the agents who have interacted with Benjamin. + +Noah, Liam, and Mila have interacted with Benjamin in the waiting room. + +Step 3: Determine the order of exits from the workshop. + +Liam exited first, followed by Noah, Avery, Mila, and Benjamin. + +Step 4: Determine the final location of the peas. + +The final location of the peas is the blue_crate. + +Step 5: Determine the possible locations that Benjamin could think the peas is in. + +Benjamin did not make any movements related to the peas, so he may not know the actual location of the peas. Therefore, he could think the peas is in any of the locations where the peas were previously located: green_drawer, blue_container, green_crate, or blue_bucket. + +Step 6: Determine where Noah thinks Benjamin thinks the peas is. 
+ +Noah and Benjamin did not interact with each other, so Noah may not know what Benjamin thinks about the location of the peas. However, Noah exited the workshop after Benjamin, so he may trust Benjamin's judgment more than his own. Since Noah did not move the peas to the blue_bucket, he may not think that Benjamin thinks the peas is in the blue_bucket. Therefore, the most likely answer is that Noah thinks Benjamin thinks the peas is in the green_drawer or the green_crate. + +Answer: E. green_drawer or O. green_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..04b9f2e1b3807ee308dcc17596693e9d4336c83e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. 
+23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Liam think Noah thinks Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to trace Liam's movements and his interactions with the other agents. Liam moved the peas from the green_drawer to the blue_container and dislikes the peas. Noah then moved the peas to the green_crate before exiting the workshop. Avery moved the peas to the blue_bucket before exiting the workshop. Mila then moved the peas to the blue_crate before exiting the workshop. Benjamin made no movements with the peas and stayed in the workshop for 1 minute before exiting. + +Liam saw a dog and made no movements in the den for 1 minute before exiting. Mila moved the melon from the red_bucket to the blue_suitcase before exiting the den. Noah made no movements in the den for 1 minute before exiting. + +Based on the assumptions, Liam can only infer Benjamin's thoughts if they had private or public interactions or were in the same place. 
However, there is no mention of Liam and Benjamin having any interactions or being in the same place. Therefore, Liam cannot know what Benjamin thinks about the peas. + +Noah moved the peas to the green_crate before exiting the workshop, and Liam made no movements with the peas before exiting the workshop. Therefore, Liam cannot know where Noah thinks the peas are. + +So, the answer to the question is: Liam does not know where Noah thinks Benjamin thinks the peas are. None of the answer choices are correct. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c7c7328e79bc06d3b4595a80d7aa33c96389f7c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. 
+23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Avery think Liam thinks Noah thinks Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: First, we need to determine where Liam thinks the peas is. Liam moved the peas from the green_drawer to the blue_container and dislikes the peas. Therefore, Liam thinks the peas is in the blue_container. + +Next, we need to determine where Noah thinks the peas is. Noah moved the peas from the blue_container to the green_crate. However, we don't know if Noah saw Liam move the peas to the blue_container or if he thought the peas was originally in the green_drawer. Therefore, we cannot determine where Noah thinks the peas is. + +Now, we need to determine where Benjamin thinks the peas is. Benjamin made no movements and stayed in the workshop for 1 minute. Therefore, we don't have any information about where Benjamin thinks the peas is. + +Finally, we need to determine where Avery thinks Liam thinks Noah thinks Benjamin thinks the peas is. 
We know that Avery moved the peas from the blue_container to the blue_bucket. However, we don't know if Avery saw Liam move the peas to the blue_container or if he thought the peas was originally in the green_drawer. Therefore, we cannot determine where Avery thinks Liam thinks Noah thinks Benjamin thinks the peas is. + +Since we cannot determine the answer, the correct option is D. blue_cupboard. + +a: 5 6 7 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f99d73e35e1e9ee42f754d8f35d7691e66ac8ad9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. 
+Question: Where is the potato really? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to track the movements of each agent and the potato. According to the story, Mila moved the potato to the red_basket, Isabella moved the potato to the green_bottle, and Jacob moved the potato to the blue_drawer. Therefore, the potato is really in the blue_drawer. The answer is B. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..317af4f7ea3042aa6d54aebc5ae8902300a6a118 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. 
+3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Isabella really think the potato is? +Answer: green_bottle +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to consider the movements of each agent and their potential interactions with each other. Isabella moved the potato to the green_bottle before exiting the crawlspace. We don't have any information about her interacting with any other agent who may have influenced her thoughts. Therefore, we can assume that Isabella really thinks the potato is in the green_bottle. The answer is C. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f9cbfd629d74940ebde1d65d30d2058d576b9ca8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. 
+22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Chloe think Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: Step 1: Identify the relevant information in the story. +- Evelyn, Chloe, Mila, Isabella, and Jacob entered the crawlspace. +- The potato was initially in the blue_drawer. +- Evelyn and Chloe stayed in the crawlspace for 1 minute each. +- Mila moved the potato to the red_basket. +- Isabella moved the potato to the green_bottle. +- Jacob moved the potato to the blue_drawer. +- Evelyn, Chloe, Mila, Isabella, and Jacob entered the waiting_room. + +Step 2: Determine the possible ways Chloe could have formed her belief about where Isabella thinks the potato is. +- Chloe could have directly asked Isabella where she thinks the potato is. +- Chloe could have overheard Isabella telling someone else where she thinks the potato is. +- Chloe could have observed Isabella moving the potato to a certain location. +- Chloe could have inferred where Isabella thinks the potato is based on her own observations and assumptions. 
+ +Step 3: Use the assumptions to eliminate some possibilities. +- Chloe could not have directly asked Isabella where she thinks the potato is, as there is no mention of any private or public interactions between them. +- Chloe could not have overheard Isabella telling someone else where she thinks the potato is, as there is no mention of Isabella making any public claims about the potato's location. + +Step 4: Use the remaining information to determine where Chloe thinks Isabella thinks the potato is. +- Chloe did not move the potato herself, so she cannot have observed Isabella moving it. +- Chloe stayed in the crawlspace for 1 minute and made no movements, so she did not see Mila or Jacob move the potato. +- Evelyn also stayed in the crawlspace for 1 minute and made no movements, so she did not see Mila or Jacob move the potato either. +- Isabella moved the potato to the green_bottle before exiting the crawlspace. +- Jacob moved the potato to the blue_drawer after Isabella. + +Based on the assumptions and the information in the story, Chloe would likely trust Jacob's claim about the potato's location more than Isabella's, as Jacob exited the crawlspace after Isabella. Therefore, Chloe would think that Isabella thinks the potato is still in the green_bottle, even though it was actually moved to the blue_drawer by Jacob. + +Answer: C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..17d93e23370872ad8222ee048d1b40d1844509e3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. 
+2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Evelyn think Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions. Evelyn and Chloe entered the crawlspace and made no movements before exiting. Mila moved the potato to the red_basket and Isabella moved it to the green_bottle before Jacob moved it to the blue_drawer. Then, Evelyn, Chloe, Mila, Isabella, and Jacob entered the waiting_room. Later, Evelyn, Mila, and Jacob entered the closet and moved the watermelon to the blue_suitcase and then to the red_drawer before exiting. Based on these movements, we can infer that Evelyn and Chloe did not have any private or public interactions regarding the location of the potato. Therefore, Evelyn has no information about where Chloe thinks the potato is. We cannot answer this question with the given information. The answer is none of the options provided. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ec6d52b44930e676b7ea5a22e6644bc4ef7415a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. 
+13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: This question requires a lot of inference and deduction based on the given assumptions. Let's break it down step by step: + +1. Jacob moved the potato to the blue_drawer, so he knows where it is. +2. Isabella moved the potato to the green_bottle, but Jacob was not present when this happened, so he does not know this. +3. Mila moved the potato to the red_basket, but Jacob was not present when this happened, so he does not know this either. +4. 
Chloe did not move the potato, so she does not know where it is. +5. Evelyn did not move the potato, but she was present when Jacob moved it to the blue_drawer, so she knows where it is. + +Based on this information, we can infer that: + +- Jacob knows the potato is in the blue_drawer. +- Evelyn knows the potato is in the blue_drawer. +- Chloe does not know where the potato is. +- Mila and Isabella may or may not know where the potato is, but Jacob does not know their thoughts on this. + +Now let's look at the question again: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? + +Since Jacob knows the potato is in the blue_drawer, he must think that Evelyn also knows this. As for Chloe and Isabella, Jacob does not know their thoughts on the location of the potato, so he cannot make any assumptions about what they think. Therefore, the answer to the question is B. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1510e2fa1c3d039317bf32cb0804c469aa9e3d4c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. 
+12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where is the cabbage really? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to follow the movements of the agents and the location of the cabbage. According to the story, the cabbage was initially in the green_envelope (step 2). Noah moved the cabbage to the green_box (step 3), and later Avery moved it back to the green_envelope (step 20). Therefore, the cabbage is really in the green_envelope. The answer is B. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..95a7e2f97e9614c29182bb5f0563cfdd3f60c40f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cabbage is? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. 
blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the cabbage and the statements made by the characters. According to the story, the cabbage was initially in the green_envelope (statement 2). Noah then moved the cabbage to the green_box (statement 3), and later Avery moved the cabbage back to the green_envelope (statement 20). We also know that Aiden likes the blue_bucket (statement 15) and that the cabbage is currently in the green_box (statement 17). + +Based on these statements, we can eliminate options D, E, F, G, H, I, J, K, L, M, N, and O as they are not related to the cabbage's location. We also know that Emma likes the red_envelope (statement 4), but there is no indication that Avery thinks the cabbage is in the red_envelope. + +Therefore, the correct answer is B. green_envelope, as Avery moved the cabbage to that location (statement 20). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..253c4a36c9b535a27d015be0a86df5ed24aef8f5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Aiden think Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. 
blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To answer this question, we need to track the movements of Aiden and Avery in relation to the cabbage. According to the story, the cabbage was initially in the green_envelope (step 2), but Noah moved it to the green_box (step 3). Later, Avery moved the cabbage back to the green_envelope (step 20). Aiden likes the blue_bucket (step 15), but there is no mention of him interacting with the cabbage until he enters the staircase with Avery and Jackson (step 16). At this point, the cabbage is in the green_box (step 17). Aiden makes no movements in the staircase (step 18) and exits after one minute (step 19). + +Based on these movements, Aiden would likely think that Avery thinks the cabbage is in the green_envelope, since that is where Avery moved it to (step 20) and Aiden did not witness any further movements of the cabbage. Therefore, the answer is B. green_envelope. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5c5f1601157a79d14c715ae120c6e7c0f297fbe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Emma think Aiden thinks Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. 
green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: This question requires a lot of careful reading and deduction. Let's break it down step by step: + +1. Where does Emma think Aiden thinks Avery thinks the cabbage is? + +2. We know that Aiden likes the blue_bucket, but we don't know anything about where he thinks the cabbage is. + +3. Avery moved the cabbage to the green_envelope, so we know that's where it currently is. + +4. Emma likes the red_envelope, but we don't know anything about where she thinks the cabbage is. + +5. We know that Noah moved the cabbage to the green_box, but we don't know if any of the other characters know this. + +6. Emma and Aiden were both in the staircase, but we don't know if they had any interactions or if Emma overheard anything Aiden said. + +7. Avery and Jackson were also in the staircase, but we don't know if they had any interactions with Emma or Aiden. + +8. Aiden, Avery, and Jackson all entered the staircase together after the cabbage was moved to the green_box, so they all know where it currently is. + +9. Aiden, Avery, and Jackson all exited the staircase in that order, so they all trust each other's knowledge of where the cabbage is. + +10. Emma exited the staircase after Aiden, so she would trust his knowledge of where the cabbage is. 
+ +Based on all of this information, we can deduce that Emma thinks Aiden thinks Avery thinks the cabbage is in the green_envelope, since that's where it currently is and Aiden would trust Avery's knowledge of its location. Therefore, the answer is B. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd35e45923a6bfa8e8bdacc3779137cd1423f8f0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. 
+Question: Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? + +2. We know that Noah moved the cabbage to the green_box (step 3) and that the cabbage is still in the green_box when Aiden, Avery, and Jackson enter the staircase (step 17). Therefore, we can eliminate options E, F, J, L, M, N, and O. + +3. We also know that Emma likes the red_envelope (step 4) and that she made no movements in the staircase (step 6) before exiting (step 7). Therefore, we can eliminate options B, C, D, I, and K since Emma did not interact with the cabbage or express any thoughts about it. + +4. This leaves us with option A (red_envelope) and H (red_container). Since Emma likes the red_envelope, it is possible that she thinks the cabbage is in there. 
However, we cannot be sure since there is no evidence to suggest that Aiden or Avery have any thoughts about the cabbage. + +5. On the other hand, Noah may trust Jackson more than Emma since Jackson exited the staircase after him (step 13). If Jackson expressed any thoughts about the cabbage to Noah, he may believe that Avery moved it to the green_envelope (step 20) since Avery exited the staircase after Aiden and Jackson (step 23). This would lead Noah to believe that Emma thinks Aiden thinks Avery thinks the cabbage is in the green_envelope. + +6. Therefore, the answer is either A (red_envelope) or H (red_container), but we cannot be certain without more information about the private or public interactions between the characters. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e95bf84f082574f7230c94819e40a13d61f0fa11 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. 
+17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where is the melon really? +Answer: red_pantry +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the melon and the agents. According to the story, the melon was initially in the red_pantry (statement 2). Owen moved the melon to the green_basket (statement 3), and Mila moved it to the green_box (statement 11). Finally, Noah moved the melon to the red_pantry (statement 13). Therefore, the melon is really in the red_pantry (option F). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..968ccec8d175684d44ea7a7811460fb3a303d370 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Owen really think the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. 
green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track Owen's movements with the melon. According to the story, Owen moved the melon from the red_pantry to the green_basket before exiting the bedroom. Therefore, Owen really thinks the melon is in the G) green_basket. The answer is G) green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c56c81afd2ce7e47552e500e86630d0b49a280e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. 
+12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Avery think Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: The question is asking about Avery's thoughts on where Owen thinks the melon is. To answer this question, we need to track the movements of Owen and the melon. + +1. Owen, Avery, Benjamin, Mila, and Noah entered the bedroom. +2. The melon is in the red_pantry. +3. Owen moved the melon to the green_basket. +4. Owen exited the bedroom. 
+ +Based on the assumption that agents tend to trust those who exit a room later than themselves, Avery would trust Owen's movements more than Benjamin, Mila, or Noah's movements. Therefore, Avery would know that Owen moved the melon from the red_pantry to the green_basket before he exited the bedroom. + +So, where does Avery think Owen thinks the melon is? Avery would think that Owen thinks the melon is in the green_basket because that is where Owen left it before he exited the bedroom. + +Therefore, the answer is G. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..32e396760abde42b5139d5bc8377adc6e8f63678 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. 
+22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Benjamin think Avery thinks Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Benjamin think Avery thinks Owen thinks the melon is? + +2. We know that Owen moved the melon from the red_pantry to the green_basket, but we don't know if Benjamin was present when this happened. + +3. Avery saw a monkey and made no movements for one minute before exiting the bedroom. This information doesn't seem relevant to the question. + +4. Owen likes the red_basket, but we don't know if this affects his thoughts about the melon's location. + +5. Benjamin made no movements and stayed in the bedroom for one minute before exiting. This means he was present when Owen moved the melon, but we don't know if he saw it happen or if he was paying attention. + +6. 
Mila moved the melon from the green_basket to the green_box, and Noah moved it from the green_box to the red_pantry. Again, this information doesn't seem relevant to the question. + +7. Noah, Avery, and Mila later moved to the dining_room and moved the sweet_potato from the red_basket to the green_bucket, then to the blue_container. This also doesn't seem relevant to the question. + +8. Owen saw a dog, and Mila made no movements for one minute before exiting the dining_room. Again, not relevant. + +9. Noah, Avery, and Mila then entered the waiting_room together. + +10. Based on the assumptions given, we know that Benjamin can only infer Avery's thoughts if they were in the same place or had private or public interactions. We don't know if this happened, so we can't make any assumptions about what Benjamin thinks Avery thinks. + +11. We do know that the melon ended up in the red_pantry, so it's possible that Benjamin thinks Owen thinks it's there. However, we don't have any information to suggest that Avery has any thoughts about the melon's location, so we can't make any assumptions about what Benjamin thinks Avery thinks. + +12. Therefore, the answer is impossible to determine based on the information given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a55e54a7dc9d93f21b50b22194f5fa27b646b25f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. 
+6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. 
Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? + +2. First, we need to determine where the melon actually is. According to the story, the melon starts in the red_pantry (line 2), is moved to the green_basket by Owen (line 3), then to the green_box by Mila (line 11), and finally to the red_pantry by Noah (line 13). + +3. Next, we need to determine who has knowledge of the melon's location. Owen, Mila, and Noah all move the melon at some point, so they know where it is. Avery and Benjamin do not move the melon, but they are in the same room as it at some point, so they may have seen it. + +4. We also need to consider the trust relationships between the agents. Noah trusts Avery more than Benjamin (since Avery exited the room after him), and Benjamin trusts Owen more than Avery (since Owen exited the room after him). + +5. Finally, we need to consider the lying tendencies of the agents. We cannot assume that what they say is true. + +6. Putting all of this together, we can start to make some inferences. Since Noah moved the melon to the red_pantry, we know that he thinks the melon is in the red_pantry. However, he is trying to determine what Benjamin thinks Avery thinks Owen thinks, so we need to consider what each of those agents knows. + +7. Avery saw a monkey (line 5) and made no movements with the melon (line 6), so we cannot infer anything about what she thinks. Benjamin also made no movements with the melon (line 9), but he trusts Owen more than Avery, so he may think that the melon is in the red_basket (line 8). + +8. Owen moved the melon to the green_basket (line 3) and likes the red_basket (line 8), so we cannot be sure what he thinks. However, since Benjamin trusts him more than Avery, we can assume that Benjamin thinks Owen knows where the melon is. + +9. Putting all of this together, we can make an educated guess about what Noah thinks Benjamin thinks Avery thinks Owen thinks. 
Since Noah knows the melon is in the red_pantry, he may think that Benjamin thinks Avery thinks Owen thinks the melon is in the red_basket (since Benjamin trusts Owen more than Avery and Owen moved the melon to the green_basket). Therefore, the answer is A. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..51e7c654f3cc937e91619d737604d256a5d7c73d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where is the melon really? 
+Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track the movements of the melon throughout the story. According to the story, the melon was initially in the blue_container when Evelyn, Isabella, Nathan, Ava, and Lily entered the hallway. Evelyn then moved the melon to the green_treasure_chest before exiting the hallway. Nathan later moved the melon to the blue_treasure_chest before exiting the hallway. Therefore, the melon is in the blue_treasure_chest, which is option N. + +The correct answer is N. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..05aa000ef6ea870ce5861219db28c7b9bb42f169 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Nathan really think the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track Nathan's movements and the movements of the melon. According to the story, Nathan moved the melon to the blue_treasure_chest before exiting the hallway. Therefore, Nathan really thinks the melon is in the blue_treasure_chest. The answer is N. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..38ed3d7620eb294fb2fa9788358fef1932306739 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. 
+21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Lily think Nathan thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: The question is asking about Lily's thoughts on where Nathan thinks the melon is. To answer this question, we need to trace Nathan's movements with the melon and determine where Lily was during those movements. + +According to the story, Nathan moved the melon to the blue_treasure_chest before exiting the hallway. Lily was still in the hallway at this point and made no movements. Therefore, Lily would have seen Nathan move the melon to the blue_treasure_chest. + +Based on Lily's known dislikes (cucumber and spinach), we can eliminate options J, K, N, O, and H. We can also eliminate options A, F, and M as they are not mentioned in the story. 
+ +Isabella made no movements and stayed in the hallway for 1 minute, so she did not interact with Nathan or the melon. Therefore, we can eliminate options B, C, D, and E as they involve Isabella's movements with the spinach. + +This leaves us with option G, the red_crate, as the only remaining option. Therefore, Lily thinks Nathan thinks the melon is in the red_crate. + +The answer is G. red_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b32268a62dafdadf06c115ec94d0ce4c103fa249 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. 
+24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Isabella think Lily thinks Nathan thinks the melon is? +Answer: green_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Isabella think Lily thinks Nathan thinks the melon is? + +2. We know that Nathan moved the melon to the blue_treasure_chest, but we don't know if Lily or Isabella were present when he did so. + +3. Isabella made no movements and stayed in the hallway for 1 minute, so she did not witness Nathan moving the melon. + +4. Lily made no movements and stayed in the hallway for 1 minute, so she also did not witness Nathan moving the melon. + +5. However, we do know that Evelyn moved the melon to the green_treasure_chest before she exited the hallway. Isabella may have witnessed this, but we don't know for sure. + +6. We also know that Lily dislikes the cucumber, but this information is not relevant to the question. + +7. 
Based on the assumptions, Isabella can only infer Nathan's thoughts if she had private or public interactions with him. We don't know if this happened, so we can't assume that Isabella knows what Nathan thinks. + +8. We also don't know if Lily has any thoughts about where the melon is, since she did not witness Nathan or Evelyn moving it. + +9. Therefore, we cannot determine where Isabella thinks Lily thinks Nathan thinks the melon is. + +10. The answer is: Insufficient information to determine. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..867c2346d8a4c1ee1528a387ca34671d6d3ef846 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. 
+21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +Answer: green_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Nathan think the melon is? +- According to the story, Nathan moved the melon to the blue_treasure_chest before exiting the hallway. Therefore, Nathan thinks the melon is in the blue_treasure_chest. The answer is J. + +2. Where does Lily think the cucumber is? +- Lily dislikes the cucumber, but there is no information about where it is located. Therefore, we cannot answer this question. + +3. Where does Isabella think the melon is? +- Isabella made no movements with the melon, but she was in the hallway with Evelyn, who moved the melon to the green_treasure_chest before exiting. 
Isabella then exited the hallway and did not interact with Nathan, who moved the melon to the blue_treasure_chest. Therefore, Isabella thinks the melon is in the green_treasure_chest. The answer is O. + +4. Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +- This question requires multiple inferences. We know that Ava dislikes the spinach, which was moved to the blue_bottle by Nathan and then to the red_bottle by Isabella. Therefore, Ava knows that the spinach is in the red_bottle. We also know that Lily dislikes the cucumber, but we don't know where it is located. Therefore, we cannot use this information to infer anything about Lily's thoughts. However, we know that Isabella thinks the melon is in the green_treasure_chest, as we determined in the previous question. Finally, we know that Nathan thinks the melon is in the blue_treasure_chest. Since Ava exited the hallway after Nathan, she trusts Nathan more than Isabella. Therefore, she thinks that Isabella thinks the melon is in the blue_treasure_chest. The answer is N. + +Therefore, the answer is N. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..97fd676edeace88f55c345c5489a7357eacc10cb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. 
+8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions with the watermelon. According to the story, Emma moved the watermelon to the blue_treasure_chest and then exited the hall. Therefore, the correct answer is E. blue_treasure_chest. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e5e08f1e382dd3487e67c773065c29fc03851da7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Noah really think the watermelon is? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to look at the movements and actions of each agent in relation to the watermelon. Noah and Abigail entered the hall together, but neither of them moved the watermelon. Emma moved the watermelon to the blue_treasure_chest after Abigail left the hall. Liam entered the hall after Emma and did not move the watermelon. Noah re-entered the hall after Liam saw a dog, but he did not move the watermelon. Therefore, based on the given information, Noah never interacted with the watermelon and made no movements towards it. We can assume that he did not have any private or public interactions with anyone who moved the watermelon either. Therefore, we cannot determine where Noah really thinks the watermelon is. The answer is not provided in the given options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..15c987c6bedd5417818012040aa304ba263a2992 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Emma think Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of Emma and Noah in relation to the watermelon. Emma dislikes the melon and moves it to the blue_treasure_chest. Noah makes no movements and stays in the hall for 1 minute before exiting. Therefore, Emma has no interaction with Noah regarding the watermelon's location. We cannot infer where Emma thinks Noah thinks the watermelon is because there is no evidence of any interaction or communication between them. The answer is not provided in the given options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4fd528a0e7d001147cf5ca2c4e82c89420f27218 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. 
+21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Liam think Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This question requires a lot of careful reading and analysis. We need to determine where Liam thinks Emma thinks Noah thinks the watermelon is. + +First, we need to identify the relevant agents in this scenario. These are Noah, Abigail, Owen, Emma, and Liam. + +Next, we need to look at the actions of each agent and their movements. We know that the watermelon was initially in the green_bucket, but Emma moved it to the blue_treasure_chest. We also know that Noah made no movements in the hall where the watermelon was located, and Liam did not enter the hall until after the watermelon had been moved. + +Based on these actions, we can eliminate some of the answer choices. We know that Liam did not witness the watermelon being moved to the blue_treasure_chest, so he cannot think that Noah thinks it is there. 
We can also eliminate any answer choices that do not involve the green_bucket or the blue_treasure_chest. + +Now we need to consider Liam's thought process. We know that he saw a dog in the hall where the persimmon was located, but we don't have any information about his thoughts on the watermelon. However, we do know that Emma moved the watermelon to the blue_treasure_chest, and Liam was the last agent to exit the hall where the watermelon was located. + +Based on the assumption that agents tend to trust those who exit a room later than themselves, we can assume that Liam trusts Emma's actions and believes that she moved the watermelon to the blue_treasure_chest for a reason. Therefore, he may think that Noah also believes the watermelon is in the blue_treasure_chest, since he did not make any movements in the hall. + +However, we also need to consider the fact that agents tend to lie and that Liam's thoughts may not be accurate. Therefore, we cannot be certain of the answer without more information. + +Based on this analysis, the answer is E. blue_treasure_chest, but with the caveat that Liam's thoughts may not be reliable. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..584818c58e467b9a7b09d6b28853d61d03015ad9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. 
+7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Owen think Liam thinks Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. Owen moved the persimmon to the green_crate, so he knows where it is. +2. Liam saw a dog, so he didn't see where the persimmon was moved to. +3. 
Liam made no movements in the hall, so he didn't move the persimmon to the green_bathtub. +4. Emma moved the watermelon to the blue_treasure_chest, so she knows where it is. +5. Emma dislikes the melon, so she wouldn't think it's in the blue_treasure_chest. +6. Noah made no movements in the hall, so he doesn't know where the watermelon is. +7. Abigail made no movements in the hall, so she doesn't know where the watermelon is. +8. Owen made no movements in the hall before moving the persimmon, so he doesn't know where the watermelon is. +9. Liam made no movements in the hall before seeing the dog, so he doesn't know where the watermelon is. +10. Owen exited the hall after Noah, so he trusts Noah's exit order and thinks Noah knows where the watermelon is. +11. Liam exited the hall after Owen, so he trusts Owen's exit order and thinks Owen knows where the watermelon is. +12. Emma exited the hall before Liam, so Liam doesn't trust her and doesn't think she knows where the watermelon is. + +Putting all of this together, we can conclude that Owen thinks Liam thinks Noah thinks the watermelon is in the green_bucket (option A). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b4d888c7283d4af034fe4bfa1ee814e6a38b629 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. 
+8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and the carrot. According to the story, Evelyn moved the carrot to the red_pantry, then exited the hall. 
Mila made no movements and stayed in the hall for 1 minute before exiting. Owen then moved the carrot to the green_drawer before exiting the hall. Lily moved the carrot to the red_envelope before exiting the hall. Finally, Noah moved the carrot to the red_basket before exiting the hall. Therefore, the carrot is really in the red_basket. The answer is A. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1fd8774d9881402ea5a90c955ebf752aff4345d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. 
+28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Noah really think the carrot is? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track Noah's movements and any interactions he had with the carrot. According to the story, Noah entered the hall with Evelyn, Mila, Owen, and Lily. He then moved the carrot to the red_basket before exiting the hall. Later, he entered the sunroom with Mila and Owen, but made no movements and stayed there for 1 minute before exiting. Finally, he entered the waiting_room with Mila and Owen. + +Based on the assumption that agents tend to trust those who exited a room later than themselves, we can assume that Noah trusts Owen's claim that he likes the green_treasure_chest. However, there is no information to suggest that Noah had any private or public interactions with any of the other agents regarding the carrot's location. 
+ +Therefore, we can conclude that Noah really thinks the carrot is in the red_basket, as that is where he moved it to and there is no evidence to suggest that he changed his mind or had any interactions that would lead him to believe otherwise. The answer is A. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a71f97f74c002a3475607aeda1fd83c5802b2b6e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. 
+Question: Where does Owen think Noah thinks the carrot is? +Answer: green_drawer +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track the movements of Owen and Noah with respect to the carrot. According to the story, Owen moved the carrot to the green_drawer and Noah moved it to the red_basket. We also know that Owen likes the red_basket and dislikes the spinach. However, we don't have any information about what Noah likes or dislikes. + +Based on the assumptions given, we can infer that Owen trusts Noah more than Mila because Noah exited the sunroom after Owen did. Therefore, Owen is more likely to believe Noah's claim about the location of the carrot. + +Since Noah moved the carrot to the red_basket and we don't have any conflicting information, we can assume that Owen thinks Noah thinks the carrot is in the red_basket. Therefore, the answer is A. red_basket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..124708b3e2ae0e85eebba9119901c6f422e95374 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Mila think Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. 
green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Mila saw Owen move the carrot to the green_drawer. +2. Mila exited the hall. +3. Owen likes the red_basket. +4. Noah moved the carrot to the red_basket. +5. Mila, Owen, and Noah entered the waiting_room. + +Based on these steps, we can infer that Mila knows that Owen moved the carrot to the green_drawer, but she doesn't know that Noah moved it to the red_basket. However, she knows that Owen likes the red_basket, so she might think that he believes the carrot is still there. + +Now we need to consider what Mila thinks Owen thinks Noah thinks. Mila didn't witness any interactions between Owen and Noah regarding the carrot, so she can only make assumptions based on what she knows about their preferences and movements. + +We know that Owen likes the red_basket, but we don't know what he thinks about the carrot's location after Noah moved it. Mila dislikes spinach, but we don't know how that affects her perception of the carrot's location. + +Therefore, we can't determine with certainty where Mila thinks Owen thinks Noah thinks the carrot is. The answer is inconclusive. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb8e10cd2e62e4f853f3d371c54c11bd52fb1c51 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. 
blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? + +2. We need to start with Noah, who moved the carrot last. According to assumption (4), Lily will trust Owen's opinion more than Noah's because Owen exited the room after Noah. So, we need to determine where Owen thinks the carrot is. + +3. Owen moved the carrot to the green_drawer, so he thinks the carrot is in the green_drawer. + +4. According to assumption (2), Mila can only infer Owen's thought if she has been in the same place as Owen or has had private or public interactions with him. Mila was in the hall when Owen moved the carrot, but we don't know if they had any interactions. Therefore, we cannot determine where Mila thinks the carrot is based on Owen's opinion. + +5. According to assumption (4), Lily will trust Mila's opinion more than Owen's because Mila exited the room after Owen. So, we need to determine where Mila thinks the carrot is. + +6. Mila made no movements in the hall, so we cannot determine where she thinks the carrot is based on her actions. + +7. 
However, we do know that Mila dislikes spinach (according to step 20), and the only option that mentions spinach is the green_drawer (where Owen thinks the carrot is). Therefore, Lily may think that Mila thinks Owen thinks the carrot is in the green_drawer. + +8. Finally, according to assumption (2), Lily can only infer Mila's thought if she has been in the same place as Mila or has had private or public interactions with her. Lily was in the hall and the waiting_room with Mila, but we don't know if they had any interactions. Therefore, we cannot determine where Lily thinks Mila thinks Owen thinks Noah thinks the carrot is. + +9. Based on the above analysis, the answer is B. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a702660ed2e0cce7e92e242a33f0e414ca7ad119 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. 
+16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the lettuce and the agents who moved it. According to the story, the lettuce was initially in the blue_container in the back yard. Nathan moved it to the green_cupboard before exiting the back yard. Logan then moved it to the blue_treasure_chest before exiting the back yard. Abigail then moved it to the red_basket before exiting the back yard. Finally, Isabella moved it back to the blue_container before exiting the back yard. Therefore, the lettuce is in the blue_container, which is option K. The correct answer is K. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bbc44bd87d708aefb6f01ccc42b57bb2df9226af --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. 
+17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Isabella really think the lettuce is? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to trace Isabella's movements with the lettuce. According to the story, Isabella moved the lettuce to the blue container (step 11). Therefore, the correct answer is K. blue_container. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f615dc70225420f76e36621ea443e78ebef6032e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. 
+25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Abigail think Isabella thinks the lettuce is? +Answer: red_basket +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of the lettuce and the agents' interactions. Here are the steps to solve the question: + +1. Abigail moved the lettuce to the red_basket. +2. Isabella moved the lettuce to the blue_container. +3. Isabella exited the hallway. +4. Abigail exited the hallway. + +Based on the assumptions, Abigail can only infer Isabella's thought if they had a private or public interaction. 
However, there is no mention of any interaction between Abigail and Isabella in the story. Therefore, we cannot determine where Abigail thinks Isabella thinks the lettuce is. + +The answer is not provided in the options given. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c089ee1fcde23bde8c43d820aef423fea2b2b0ac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. 
+26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks Isabella thinks the lettuce is? +Answer: green_cupboard +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: First, we need to determine where the lettuce actually is. According to the story, the lettuce was moved several times. It started in the blue_container, then Nathan moved it to the green_cupboard, Logan moved it to the blue_treasure_chest, Abigail moved it to the red_basket, and finally Isabella moved it back to the blue_container. So, the lettuce is in the blue_container. + +Next, we need to determine the thought process of Nathan, Abigail, and Isabella. 
Nathan dislikes lettuce, so he probably didn't pay much attention to where it was moved. Abigail moved the lettuce to the red_basket, but we don't know if she knew where it was before that. Isabella moved the lettuce back to the blue_container, so she definitely knows where it is. + +Now, we need to determine where Nathan thinks Abigail thinks Isabella thinks the lettuce is. Since Nathan dislikes lettuce and probably didn't pay much attention to where it was moved, he may not have a strong opinion on where Abigail or Isabella think it is. However, we do know that Isabella moved the lettuce back to the blue_container, so Nathan may assume that Abigail thinks it is still in the red_basket. Therefore, Nathan may think that Abigail thinks Isabella thinks the lettuce is in the red_basket. + +The answer is A. red_crate. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3505806a69081b92619100523e50b72cbf48294 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. 
+14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Logan think Nathan thinks Abigail thinks Isabella thinks the lettuce is? +Answer: green_cupboard +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: First, we need to determine where the lettuce is at the end of the story. Isabella moved the lettuce to the blue container (step 11). + +Next, we need to determine where Abigail moved the lettuce. Abigail moved the lettuce to the red basket (step 9). + +Then, we need to determine where Nathan moved the tangerine. Nathan moved the tangerine to the red container (step 34). + +Now, we need to determine where Logan moved the melon. Logan moved the melon to the red crate (step 22). + +Finally, we need to determine where Nathan thinks Abigail thinks Isabella thinks the lettuce is. Since Nathan dislikes lettuce (step 18), he is unlikely to have moved it. Abigail moved the lettuce to the red basket, but we don't know what she thinks about where it is. Isabella moved the lettuce to the blue container, but we don't know what she thinks about where it is. Logan moved the lettuce to the blue treasure chest (step 5), but we need to determine where he thinks Abigail thinks Isabella thinks the lettuce is. + +Logan dislikes lettuce (step 13), so he is unlikely to have moved it. We know that Isabella moved the lettuce to the blue container (step 11), but we don't know what she thinks about where it is. Abigail moved the lettuce to the red basket (step 9), but we don't know what she thinks about where it is. Nathan moved the tangerine to the red container (step 34), but we don't know what he thinks about where the lettuce is. + +Based on the given information, we cannot determine where Logan thinks Nathan thinks Abigail thinks Isabella thinks the lettuce is. Therefore, the answer is not provided in the options given. 
+ +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d88a7a6faabf3b3bd9dbcbbb75c6ff36ceaafefd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. 
+32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of the sweet_potato throughout the story. Initially, the sweet_potato is in the red_container in the kitchen. Ava moves it to the blue_cupboard before leaving the kitchen. Charlotte then moves it to the green_drawer before leaving the kitchen. Finally, William moves it back to the red_container before leaving the kitchen. Therefore, the sweet_potato is really in the red_container, which is option F. The other options are all places where the sweet_potato was temporarily moved to but not where it currently is. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab6d8929fe08ca70ccf0499bfc33d73498b5f937 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. 
+33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the sweet_potato is? +Answer: blue_cupboard +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of the sweet_potato and the agents who interacted with it. The sweet_potato was initially in the red_container when all five agents entered the kitchen. Ava moved it to the blue_cupboard before leaving the kitchen. Charlotte then moved it to the green_drawer before leaving the kitchen. Finally, William moved it back to the red_container before leaving the kitchen. + +Evelyn was the only agent who did not interact with the sweet_potato in the kitchen. She then entered the hallway with Ava and Logan, where they saw the peas in the red_basket. Evelyn moved the peas to the green_bathtub before leaving the hallway. 
+ +Based on the assumptions given, we know that Evelyn can only infer the location of the sweet_potato based on her interactions with other agents or their public claims. Since she did not interact with the sweet_potato in the kitchen, she would have to rely on the claims of Ava, Charlotte, William, or Logan. + +However, we also know that every agent tends to lie, so their claims cannot be trusted. Therefore, we cannot determine where Evelyn really thinks the sweet_potato is based on the given information. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e7b524b6f81dba4b0fb56d4dbc34a378538aecf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. 
+20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Logan think Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of Logan and Evelyn and their interactions with the sweet_potato. Logan entered the kitchen with Evelyn, Ava, Charlotte, and William. He made no movements and stayed in the kitchen for 1 minute before exiting. 
Evelyn also made no movements and stayed in the kitchen for 1 minute before exiting. + +Ava saw a mouse and moved the sweet_potato from the red_container to the blue_cupboard before exiting the kitchen. Charlotte then moved the sweet_potato to the green_drawer before exiting the kitchen. Finally, William moved the sweet_potato back to the red_container before exiting the kitchen. + +Logan, Ava, and Evelyn then entered the hallway, where the peas were located in the red_basket. Ava made no movements and stayed in the hallway for 1 minute before exiting. Logan also made no movements and stayed in the hallway for 1 minute before exiting. Evelyn then moved the peas to the green_bathtub before exiting the hallway. + +Logan, William, Evelyn, and Charlotte then entered the bedroom, where the banana was located in the green_cupboard. William moved the banana to the green_bottle before exiting the bedroom. Logan then moved the banana to the green_envelope before exiting the bedroom. Evelyn then moved the banana to the red_crate before exiting the bedroom. Finally, Charlotte moved the banana to the green_pantry before exiting the bedroom. + +Based on these movements, we can determine that Logan and Evelyn were both in the kitchen when the sweet_potato was moved around. However, Logan made no movements and did not interact with the sweet_potato, so he would not have any information about its location beyond what he saw when he first entered the kitchen. + +Evelyn, on the other hand, stayed in the kitchen for 1 minute and may have seen the sweet_potato being moved around. However, we do not have any information about where she thinks the sweet_potato is. Therefore, we cannot determine where Logan thinks Evelyn thinks the sweet_potato is. The answer is not provided in the given options. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e24fa0bdbb1c8032d48a9b9c4b852a349a6c7eb4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. 
+33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Charlotte think Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of each character and their interactions. Here are the steps to solve the question: + +1. Charlotte moved the sweet_potato to the green_drawer. +2. William moved the sweet_potato to the red_container. +3. Logan, Ava, Evelyn, Charlotte, and William entered the waiting_room. +4. Ava, Logan, and Evelyn entered the hallway. +5. Evelyn moved the peas to the green_bathtub. +6. William, Logan, Evelyn, and Charlotte entered the bedroom. +7. William moved the banana to the green_bottle. +8. Logan moved the banana to the green_envelope. +9. Evelyn moved the banana to the red_crate. +10. Charlotte moved the banana to the green_pantry. +11. William, Logan, Evelyn, and Charlotte entered the waiting_room. 
+ +Based on the assumption that an agent can only infer another agent's thought if they have been in the same place or have had private or public interactions, we can conclude that Charlotte has no way of knowing where Logan thinks Evelyn thinks the sweet_potato is. + +None of the movements or interactions mentioned in the story involve Logan, Evelyn, or the sweet_potato after Charlotte moved it to the green_drawer and William moved it to the red_container. Therefore, Charlotte cannot infer Logan's thoughts on where Evelyn thinks the sweet_potato is. + +The answer is none of the above options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e856051630bfcfa2229e85ad56cc0de275f3cd1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1,65 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. 
+19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does William think Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to trace the movements of each character and their interactions. Here are the steps to follow: + +1. 
William moved the sweet_potato to the red_container. +2. Charlotte moved the sweet_potato to the green_drawer. +3. Logan did not move the sweet_potato. +4. Ava moved the sweet_potato to the blue_cupboard. +5. Evelyn did not move the sweet_potato. + +Based on these movements, we can see that the sweet_potato was moved to different locations by different characters. However, we need to determine where William thinks Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is. + +Since William and Charlotte were both in the kitchen when the sweet_potato was first introduced, they could have interacted and shared their thoughts. However, Logan did not move the sweet_potato, so he may not have had a strong opinion on its location. + +Evelyn moved the peas to the green_bathtub in the hallway, but this does not give us any information about her thoughts on the sweet_potato. + +Therefore, we need to focus on Charlotte's movements and her potential interactions with William. Charlotte moved the sweet_potato to the green_drawer, which means she may have thought it was a good location for it. William may have observed this and inferred that Charlotte thinks the sweet_potato should be in the green_drawer. + +However, we still need to determine what Charlotte thinks Logan thinks Evelyn thinks about the sweet_potato. Since Logan did not move the sweet_potato, he may not have had a strong opinion on its location. Therefore, Charlotte's thoughts on Logan's thoughts may not be relevant. + +Evelyn moved the peas to the green_bathtub, but this does not give us any information about her thoughts on the sweet_potato. + +Therefore, we can conclude that William thinks Charlotte thinks the sweet_potato is in the green_drawer, but we cannot determine what Charlotte thinks Logan thinks Evelyn thinks about the sweet_potato. The answer is J. green_drawer. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..95f2c9a03497770a3e088521070d05f0166bf30d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. 
+33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where is the melon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To solve this question, we need to track the movements of the agents and the location of the melon. According to the story, the melon was initially in the green_bathtub, then moved to the blue_pantry by Aiden, then to the green_bucket by Emma, and finally to the green_bathtub by Isla. Therefore, the melon is actually in the green_bathtub. The answer is A. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e69464555783b2090218021bb19c2b034256c892 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. 
+33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does William really think the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track William's movements and the movements of the melon. William entered the porch with the group, made no movements, and then exited. Therefore, he did not move the melon to the blue_pantry or the green_bucket. The melon was eventually moved to the green_bathtub by Isla. William then entered the waiting_room with the group and later exited to the front_yard. Isla moved the beans to the green_bottle in the front_yard, but there is no mention of the melon being moved again. Therefore, based on the story and assumptions, William really thinks the melon is in the green_bathtub. The answer is A. green_bathtub. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6644e99af1174239aae5bed220308747ab60192 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. 
+33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Lily think William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of William and Lily and their interactions with the melon. William entered the porch and made no movements, so he did not interact with the melon. Lily also made no movements in the porch, so she did not interact with the melon either. Aiden moved the melon to the blue_pantry, so Lily could have seen this happen. However, we do not know if Lily trusts Aiden's movements or not. Therefore, we cannot determine where Lily thinks William thinks the melon is based on the given information. The answer is not provided in the options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6eae3fc1622678e970c5a1ee7f144ad59c75575a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1,133 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. 
+33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Emma think Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Emma think Lily thinks William thinks the melon is? + +2. We know that William, Lily, Aiden, Emma, and Isla entered the porch together. + +3. William made no movements and stayed in the porch for 1 minute before exiting. + +4. Lily made no movements and stayed in the porch for 1 minute before exiting. + +5. Aiden moved the melon to the blue_pantry. + +6. Lily likes the green_bucket. + +7. Emma moved the melon to the green_bucket. + +8. Isla moved the melon to the green_bathtub. + +9. William, Lily, Aiden, Emma, and Isla entered the waiting_room together. + +10. Emma, Isla, and Aiden entered the basement together. + +11. The watermelon is in the blue_suitcase. + +12. 
Emma made no movements and stayed in the basement for 1 minute before exiting. + +13. Isla moved the watermelon to the blue_bottle. + +14. Aiden made no movements and stayed in the basement for 1 minute before exiting. + +15. Emma, Isla, and Aiden entered the waiting_room together. + +16. Aiden likes the red_pantry. + +17. William, Isla, Aiden, and Lily entered the front_yard together. + +18. The beans is in the red_bottle. + +19. William made no movements and stayed in the front_yard for 1 minute before exiting. + +20. Isla likes the green_cupboard. + +21. Isla moved the beans to the green_bottle. + +22. Aiden made no movements and stayed in the front_yard for 1 minute before exiting. + +23. Lily made no movements and stayed in the front_yard for 1 minute before exiting. + +24. William, Isla, Aiden, and Lily entered the waiting_room together. + +Based on the story and assumptions, we can infer that Emma thinks Lily thinks William thinks the melon is in the green_bucket. Here's why: + +1. Emma moved the melon to the green_bucket. + +2. Lily likes the green_bucket. + +3. William made no movements and stayed in the porch for 1 minute before exiting, so he did not see where the melon was moved. + +4. Lily made no movements and stayed in the porch for 1 minute before exiting, so she did not see where the melon was moved. + +5. Aiden moved the melon to the blue_pantry, so he knows where it is but did not exit the porch after moving it. + +6. Isla moved the melon to the green_bathtub, so she knows where it is but did not exit the porch after moving it. + +7. Emma, Isla, and Aiden entered the basement together, so they know where the watermelon is but did not see where the melon was moved. + +8. The watermelon is in the blue_suitcase, so it is not relevant to the location of the melon. + +9. Isla moved the watermelon to the blue_bottle, so she knows where it is but did not see where the melon was moved. + +10. 
Aiden likes the red_pantry, so he may have a bias towards thinking the melon is in the red_pantry. + +11. William, Isla, Aiden, and Lily entered the front_yard together, so they did not see where the melon was moved. + +12. The beans is in the red_bottle, so it is not relevant to the location of the melon. + +13. William made no movements and stayed in the front_yard for 1 minute before exiting, so he did not see where the melon was moved. + +14. Isla likes the green_cupboard, so she may have a bias towards thinking the melon is in the green_cupboard. + +15. Isla moved the beans to the green_bottle, so she knows where they are but did not see where the melon was moved. + +16. Aiden made no movements and stayed in the front_yard for 1 minute before exiting, so he did not see where the melon was moved. + +17. Lily made no movements and stayed in the front_yard for 1 minute before exiting, so she did not see where the melon was moved. + +18. William, Isla, Aiden, and Lily entered the waiting_room together, so they did not have any private or public interactions that would give them information about the location of the melon. + +Based on these observations, we can conclude that Emma thinks Lily thinks William thinks the melon is in the green_bucket, since Emma moved the melon there and Lily likes the green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4ed58b21fbcb575cfea65f55141cf08c39074ef --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1,57 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. 
+3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Isla think Emma thinks Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: This is a complex question that requires breaking down the relationships between the characters and their movements. To start, we need to identify the chain of thoughts that Isla is considering. According to the question, Isla is thinking about what Emma thinks Lily thinks William thinks about the melon's location. + +We know that the melon starts in the green_bathtub and is eventually moved to the blue_pantry and then to the green_bucket before being moved again to the green_bathtub. Emma, Isla, and Aiden are the only ones who move the melon. + +Based on the assumption that agents tend to trust those who exit a room later than themselves, we can assume that Isla trusts Emma's movements more than Lily's or William's. + +Therefore, we need to trace Emma's movements and determine where she thinks the melon is located. Emma moves the melon to the green_bucket, so she thinks it is in the green_bucket. + +Next, we need to determine where Lily thinks the melon is located. Lily makes no movements, so we need to look at her likes and dislikes. According to the story, Lily likes the green_bucket, so she likely thinks the melon is in the green_bucket. + +Finally, we need to determine where William thinks the melon is located. William makes no movements and stays in the porch and front yard for one minute each. 
We don't have any information about his likes or dislikes, so we can't make any assumptions about where he thinks the melon is located. + +Therefore, Isla thinks that Emma thinks Lily thinks the melon is in the green_bucket. The answer is C. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..83ef99b5162d04cf840571e5261a2a1176f57516 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. 
+25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where is the beans really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of each agent and where they moved the beans. According to the story, the beans were initially in the blue_suitcase. Jack moved the beans to the green_treasure_chest, but then Benjamin moved the beans back to the blue_suitcase. Therefore, the beans are still in the blue_suitcase. The answer is A. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..165adccaad1d2e719cee9cf62b2e2f7095ca6350 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. 
+31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Jack really think the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: Step 1: Look for clues in the story about Jack's movements and interactions. +- Jack moved the beans to the green_treasure_chest (line 7). +- Jack made no movements and stayed in the workshop for 1 minute (line 18). +- Jack made no movements and stayed in the hall for 1 minute (line 28). +- Jack exited the hall (line 29). + +Step 2: Use the assumptions to infer Jack's actual thought. +- Jack may lie about where he thinks the beans is. +- Jack may trust Benjamin's claim about the beans' location since Benjamin exited the hall after him. +- Jack may have private or public interactions with Owen, Jackson, or Benjamin that could affect his actual thought. + +Step 3: Eliminate answer choices that have no connection to Jack's movements or interactions. 
+- Blue_bathtub, green_bathtub, green_envelope, blue_bottle, blue_cupboard, blue_bucket, green_bottle, red_box, red_container, green_pantry, green_cupboard, and red_bottle have no connection to Jack's movements or interactions. + +Step 4: Consider the remaining answer choices and how they relate to Jack's movements and interactions. +- Blue_suitcase: Jack moved the beans to the green_treasure_chest, so he may not think the beans is still in the blue_suitcase. +- Green_treasure_chest: Jack moved the beans here, so he may think the beans is still here. +- Red_basket: There is no indication that Jack interacted with the red_basket or had any private or public interactions that would lead him to believe the beans is there. + +Step 5: Choose the answer choice that best fits the clues and assumptions. +- Based on the story and assumptions, it is most likely that Jack thinks the beans is in the green_treasure_chest. Therefore, the answer is E. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa304943944686ed6205657508288abde0b016a7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. 
+11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Owen think Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track Owen and Jack's movements and where the beans were moved to. According to the story, Owen and Jack both entered the hall together with the beans in the blue suitcase. Jack then moved the beans to the green treasure chest before exiting the hall. Owen made no movements in the hall and exited after Jack. + +Based on the assumptions given, we know that Owen can only infer Jack's thoughts if they had private or public interactions. However, there is no mention of any interactions between Owen and Jack regarding the location of the beans. Therefore, we cannot determine where Owen thinks Jack thinks the beans are. + +The answer is: Cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3102d603cc879f0e8d86588fe499ff247320121c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. 
+13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Liam think Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to trace the movements of Owen, Jack, and Liam and their interactions with each other. + +According to the story, Owen and Liam both entered the hall and made no movements before exiting. Jack then moved the beans to the green_treasure_chest before exiting. + +There is no mention of Liam interacting with Owen or Jack in the hall, so we cannot infer what Liam thinks about their thoughts on the location of the beans. + +Therefore, the answer is not provided in the story and the correct answer is not listed among the options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9efb2a32c58f311bbb0337f40f0d20ee074be31e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. 
+16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Benjamin think Liam thinks Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis. We need to trace the path of the beans and the movements of the agents to determine where Benjamin thinks Liam thinks Owen thinks Jack thinks the beans is. + +According to the story, the beans start in the blue_suitcase (2), then Jack moves them to the green_treasure_chest (7), and finally Benjamin moves them back to the blue_suitcase (11). + +We know that Owen and Liam make no movements in the hall (3, 5) and that Owen likes the blue_bathtub (26). Jack also makes no movements in the hall (28). + +In the workshop, we learn that the cherry is in the red_basket (15). Owen, Jack, and Jackson make no movements in the workshop (16, 18, 20). + +Finally, all four agents (Owen, Jack, Benjamin, and Jackson) enter the hall together (23) and the beans are still in the blue_suitcase (24). Owen makes no movements in the hall (25) and likes the blue_bathtub (26). Jack also makes no movements in the hall (28). Benjamin and Jackson make no movements in the hall (30, 32). + +Based on this information, we can determine that Benjamin thinks Liam thinks Owen thinks the beans is in the blue_suitcase (A). This is because the beans start and end in the blue_suitcase, and none of the agents who make movements (Jack, Benjamin, and Jackson) move the beans anywhere else. Liam and Owen also make no movements in the hall, so they would not have seen the beans move. + +Therefore, the answer is A. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b2a3516835494f464ecb01362efdd2f6666fd7e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the corn and the statements made by the agents. According to the story, the corn was initially in the green_bathtub (step 2). William moved the corn to the green_cupboard (step 3), and then Emily moved it to the red_envelope (step 7). Isla then moved the corn to the green_bottle (step 11), and finally, Jackson moved it back to the green_bathtub (step 13). + +Therefore, the correct answer is K. green_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..10569d0d675e98e0504beb7261af2355485c6a88 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. 
+8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does William really think the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track William's movements and the movements of the corn. According to the story, William initially moved the corn from the green_bathtub to the green_cupboard. Later, Isla moved the corn from the green_cupboard to the green_bottle, and then Jackson moved the corn back to the green_bathtub. When William, Isla, Emily, and Emma entered the pantry again, the corn was back in the green_bathtub. William made no movements and stayed in the pantry for one minute before leaving. + +Based on this information, we can eliminate options A, B, C, D, E, F, G, I, J, and L because William never moved the corn to any of those locations. We can also eliminate option O because Emma, not William, likes the blue_crate. + +That leaves us with options H and N. Isla moved the corn to the green_cupboard before William entered the pantry, so it's possible that William thinks the corn is still in the green_cupboard. However, when William and the others entered the pantry again, the corn was in the green_bathtub. Since William made no movements and stayed in the pantry for one minute before leaving, it's possible that he saw the corn in the green_bathtub and thinks that's where it is. + +Therefore, the answer is N. William really thinks the corn is in the green_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..62ede8f7ade2b7e9ead779a63c684638890db37f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. 
+34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emily think William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of William and the corn. William initially moved the corn from the green_bathtub to the green_cupboard, but later made no movements and stayed in the pantry for a minute before exiting. Emily then moved the corn from the green_cupboard to the red_envelope before exiting the pantry. Isla then moved the corn from the red_envelope to the green_bottle before exiting the pantry. Jackson then moved the corn from the green_bottle back to the green_bathtub before exiting the pantry. + +Based on these movements, Emily would know that William moved the corn from the green_bathtub to the green_cupboard, but she would not know that he later made no movements and stayed in the pantry for a minute. 
Therefore, she would think that William still believes the corn is in the green_cupboard. + +The answer is M. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..74081e9b883462949c7e6de5e526bdc30aa5abf2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1,69 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. 
+30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emma think Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to trace the movements of William, Emily, and Emma in relation to the corn. + +1. William, Emily, Emma, Isla, and Jackson entered the pantry. +2. The corn is in the green_bathtub. +3. William moved the corn to the green_cupboard. +4. Emma likes the blue_crate. +6. William dislikes the corn. +7. Emily moved the corn to the red_envelope. +10. Emma exited the pantry. +11. Isla moved the corn to the green_bottle. +13. Jackson moved the corn to the green_bathtub. +15. William, Emily, Emma, Isla, and Jackson entered the waiting_room. +26. William, Isla, Emily, and Emma entered the pantry. +27. The corn is in the green_bathtub. +30. 
Isla moved the corn to the green_cupboard. +32. Emily moved the corn to the blue_crate. +35. Emma moved the corn to the green_bottle. +37. William, Isla, Emily, and Emma entered the waiting_room. + +Based on these movements, we know that William initially moved the corn from the green_bathtub to the green_cupboard, and then later made no movements when he re-entered the pantry. Emily moved the corn from the green_cupboard to the red_envelope, and then later moved it to the blue_crate. Emma made no movements with the corn in the first pantry visit, and then moved it to the green_bottle in the second pantry visit. + +Since Emma never witnessed William's dislike of the corn, she may assume that he still thinks the corn is in the green_bathtub. However, we need to determine where she thinks Emily thinks William thinks the corn is. + +We know that Emily moved the corn from the green_cupboard to the red_envelope, and then to the blue_crate. Since Emma likes the blue_crate, she may assume that Emily thinks William thinks the corn is in the blue_crate. Therefore, the answer is option D. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5dc69b4d41bfa8b9cd4131ace2f4e8a4c3226f40 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. 
+9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: This is a complex question that requires breaking down the thought process of each agent involved. + +Starting with Jackson, he moved the corn to the green bathtub and then exited the pantry. He did not witness any of the subsequent movements of the corn. + +Next, Isla moved the corn to the green bottle before exiting the pantry. + +Then, Emily moved the corn to the blue crate and saw a mouse before exiting the pantry. + +Finally, Emma moved the corn to the green bottle before exiting the pantry. + +William did not move the corn during this sequence, but he did move the asparagus from the green bucket to the green drawer while in the crawlspace. + +Based on these movements, Jackson would think that Emma thinks the corn is in the green bottle, since that is where she last moved it. However, he cannot infer what Emily or William think about the corn's location since he did not witness their movements. + +Therefore, the answer is N. green bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..43f28c16cdfe7ffe8bf58f11b2b4d3b16704d658 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. 
+3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where is the cucumber really? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the location of the cucumber. According to the story, Abigail moved the cucumber to the blue_container, and then Hannah moved it to the blue_bathtub. Owen later moved the carrot to the red_pantry, but there is no mention of him moving the cucumber. Therefore, the cucumber is still in the blue_bathtub. The answer is K. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b78af8a686aecafe0720caea1db7f034830c6b71 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. 
+12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cucumber is? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To solve this question, we need to track Avery's movements and any interactions he had with other agents regarding the cucumber. According to the story, Avery made no movements after Hannah exited the basement with the cucumber in the blue_bathtub. Therefore, Avery did not move the cucumber to any other location. We also do not have any information about Avery having any private or public interactions regarding the cucumber. + +Based on these assumptions, we can conclude that Avery really thinks the cucumber is still in the blue_bathtub. Therefore, the answer is K. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..483328afd8c080813aa56180d26efac7e58baf02 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. 
+16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Abigail think Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of Abigail and Avery with respect to the cucumber. Abigail moved the cucumber to the blue_container in step 3 and then exited the basement in step 4. Avery made no movements with respect to the cucumber and stayed in the basement for 1 minute in step 13 before exiting in step 14. Therefore, Abigail thinks that Avery thinks the cucumber is still in the blue_container. The answer is O. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd3a44a8c32efd46498d7559243707a17529064d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. 
+21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Hannah think Abigail thinks Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions given. To break it down, we need to identify the agents involved and their movements related to the cucumber. 
+ +Agents involved: Abigail, Hannah, Avery + +Movements related to the cucumber: +- The cucumber is initially in the blue_drawer. +- Abigail moves the cucumber to the blue_container. +- Hannah moves the cucumber to the blue_bathtub. + +Based on assumption (2), Hannah can only infer Abigail's thought if they have been in the same place or have had private or public interactions. From the story, we know that Abigail exited the basement before Hannah entered it again. Therefore, they did not have any interactions in the basement. + +However, we also know from assumption (4) that Hannah tends to trust Abigail more than Avery because Abigail exited the basement later than Avery. Therefore, Hannah may assume that Abigail knows where the cucumber is. + +From the story, we know that the cucumber is in the blue_bathtub when Hannah exits the basement. Therefore, Hannah may think that Abigail thinks Avery thinks the cucumber is in the blue_bathtub. + +The answer is K. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4fc318bd8a1f4166b255bd2d4fb178ee123b747 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. 
+11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Owen think Hannah thinks Abigail thinks Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions given. To start, we need to identify the agents involved in the question: Owen, Hannah, Abigail, and Avery. + +Next, we need to trace the movements of the cucumber and who interacted with it. According to the story, Abigail moved the cucumber to the blue_container, Hannah later moved it to the blue_bathtub, and Owen moved it to the red_pantry. Avery did not interact with the cucumber at all. + +Now we can start to piece together the answer. We know that Owen is the one doing the thinking, and he is trying to determine where Hannah thinks Abigail thinks Avery thinks the cucumber is. + +Based on the story, we know that Abigail moved the cucumber to the blue_container, but we don't know if she told anyone else about it. Hannah later moved the cucumber to the blue_bathtub, so she must have thought it was there. However, we don't know if she knew that Abigail had moved it to the blue_container. + +Since Owen moved the cucumber to the red_pantry, he must have thought it was there. But we don't know if he knew where Hannah thought it was. + +So, to answer the question, we need to determine where Hannah thought the cucumber was and whether she knew where Abigail had moved it. Based on the story, we can assume that Hannah did not know that Abigail had moved the cucumber to the blue_container, since she later moved it to the blue_bathtub. + +Therefore, Owen would think that Hannah thinks Abigail thinks Avery thinks the cucumber is in the blue_bathtub (option K). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..626e4934672dda007d55b4916317978474516ced --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the sweet_potato and the agents. According to the story, the sweet_potato was initially in the green_bottle when Jacob, Mila, Elizabeth, Aiden, and Amelia entered the master_bedroom. Aiden then moved the sweet_potato to the blue_bucket before exiting the master_bedroom. However, Amelia later moved the sweet_potato back to the green_bottle before leaving the master_bedroom. Therefore, the sweet_potato is really in the (B) green_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..462e12949e65df2acb886eb00e7aec5e4109c06a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Jacob really think the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track Jacob's movements and the movements of the sweet_potato. Jacob entered the master_bedroom with the sweet_potato in the green_bottle. He made no movements and stayed in the master_bedroom for 1 minute before exiting. Aiden then moved the sweet_potato to the blue_bucket, and later Amelia moved it back to the green_bottle before they all entered the waiting_room. Jacob did not have any private or public interactions with Aiden or Amelia regarding the sweet_potato. Therefore, we cannot infer Jacob's actual thought about the sweet_potato's location. The answer is unknown. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..081482511ac49f7fedf14e4d506d54a586c81d63 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Aiden think Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of Aiden and Jacob regarding the sweet_potato. Aiden moved the sweet_potato to the blue_bucket, and then he exited the master_bedroom. Jacob did not move the sweet_potato and exited the master_bedroom after Aiden. Therefore, according to assumption (4), Aiden tends to trust Jacob's thoughts more than his own. Since Jacob did not move the sweet_potato, Aiden would think that Jacob still believes the sweet_potato is in the original location, which is the green_bottle. Therefore, the answer is B. green_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad37f3d3f3f3b647fc5fed56c8345936fa87cb22 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Mila think Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of Aiden, Jacob, and Mila regarding the sweet_potato. Aiden moved the sweet_potato to the blue_bucket, and then he exited the master_bedroom. Jacob made no movements and stayed in the master_bedroom for 1 minute before exiting. Mila also made no movements and stayed in the master_bedroom for 1 minute before exiting. Therefore, Mila knows that Aiden moved the sweet_potato to the blue_bucket, but she doesn't know where Jacob thinks the sweet_potato is. So, Mila cannot think about where Aiden thinks Jacob thinks the sweet_potato is. The answer is not given in the story. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..137dbce602211c7d84a485452f0ee274115eaa1a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Elizabeth think Mila thinks Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their interactions. + +- Jacob and Mila entered the master_bedroom and made no movements. +- Elizabeth also entered the master_bedroom and made no movements. +- Aiden moved the sweet_potato to the blue_bucket. +- Amelia moved the sweet_potato to the green_bottle. +- All agents entered the waiting_room. +- Amelia, Mila, and Elizabeth entered the crawlspace. +- Amelia lost his watch. +- Mila moved the carrot to the green_treasure_chest. +- Elizabeth moved the carrot to the blue_pantry. +- All agents entered the office. +- Amelia moved the peach to the green_bucket. 
+- Jacob moved the peach to the green_drawer. +- Aiden and Mila made no movements. +- All agents entered the waiting_room. + +Based on the movements, we can infer that Elizabeth and Mila were in the same room (master_bedroom, waiting_room, crawlspace, and office). Aiden and Jacob were also in the same room (master_bedroom and office). However, there is no interaction between Mila and Aiden or Jacob, so Elizabeth cannot infer their thoughts. + +The only item that all agents interacted with is the sweet_potato. Aiden moved it to the blue_bucket, and Amelia moved it to the green_bottle. Therefore, Elizabeth thinks that Mila thinks Aiden thinks the sweet_potato is in the C. blue_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..549189f2a5dd0018eec0e73b786c5bd2e85bcbfc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. 
+16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where is the persimmon really? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of the persimmon. 
According to the story, the persimmon was initially in the red_basket (step 2), then Hannah moved it to the blue_crate (step 3), then Carter moved it to the green_basket (step 7), and finally William moved it back to the red_basket (step 11). Therefore, the persimmon is really in the red_basket. The answer is F. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..97461a858e2516a97281f01720b3d8142c9bc585 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. 
+23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does William really think the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of the persimmon and the agents' interactions. + +1. Hannah, Alexander, Carter, Avery, and William entered the bedroom. +2. The persimmon is in the red_basket. +3. Hannah moved the persimmon to the blue_crate. +4. Hannah exited the bedroom. +5. Alexander made no movements and stayed in the bedroom for 1 minute. +6. Alexander exited the bedroom. +7. Carter moved the persimmon to the green_basket. +8. Carter exited the bedroom. +9. 
Avery made no movements and stayed in the bedroom for 1 minute. +10. Avery exited the bedroom. +11. William moved the persimmon to the red_basket. + +Based on the assumption that agents tend to lie, we cannot trust what William says about the persimmon's location. However, we can infer his actual thought based on his movements and interactions with other agents. + +William was the last agent to exit the bedroom, so he may trust the movements of the agents who exited before him. Carter moved the persimmon to the green_basket, but William moved it back to the red_basket. This suggests that William thinks the persimmon is in the red_basket, even though he may claim otherwise. + +Therefore, the answer is A. red_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f342aa49efe20acc51382677de4e8591f597266 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. 
+15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Hannah think William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of the persimmon and the agents' interactions. + +1. 
Hannah moved the persimmon from the red_basket to the blue_crate. +2. Carter moved the persimmon from the blue_crate to the green_basket. +3. William moved the persimmon from the green_basket to the red_basket. + +Hannah exited the bedroom before any other agent moved the persimmon. Therefore, she does not know about Carter and William's movements. + +In the waiting room, Hannah, Alexander, Carter, Avery, and William were present. However, William, Alexander, and Hannah went to the bathroom, leaving only Carter and Avery in the waiting room. + +When they returned from the bathroom, William, Alexander, Avery, and Hannah went to the garage. There, Alexander moved the plum from the red_drawer to the green_cupboard, Avery moved it to the blue_treasure_chest, William moved it to the green_bottle, and Hannah moved it to the blue_bathtub. + +Since Hannah was not present when William moved the persimmon to the red_basket, she does not know where he thinks the persimmon is. Therefore, we cannot determine where Hannah thinks William thinks the persimmon is. + +The answer is: Cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..18acafba5296d23aabca18199fd2efe013150162 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1,86 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. 
+7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Avery think Hannah thinks William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to track the movements of the persimmon and the thoughts of the agents. Here are the steps to follow: + +1. Hannah moved the persimmon from the red_basket to the blue_crate. +2. Carter moved the persimmon from the blue_crate to the green_basket. +3. William moved the persimmon from the green_basket to the red_basket. + +So, the persimmon is currently in the red_basket. + +Now, let's track the movements of the agents and their thoughts: + +1. Hannah exited the bedroom and we don't know her thoughts. +2. Alexander made no movements and stayed in the bedroom for 1 minute. We don't know his thoughts. +3. Carter exited the bedroom and we don't know his thoughts. +4. Avery made no movements and stayed in the bedroom for 1 minute. We don't know her thoughts. +5. William exited the bedroom and we don't know his thoughts. +6. Hannah, Alexander, Carter, Avery, and William entered the waiting_room. We don't know their thoughts. +7. William, Alexander, and Hannah entered the bathroom. We don't know their thoughts. +8. William moved the banana from the red_bucket to the red_crate. We don't know his thoughts. +9. Alexander made no movements and stayed in the bathroom for 1 minute. We don't know his thoughts. +10. Hannah made no movements and stayed in the bathroom for 1 minute. We don't know her thoughts. +11. William, Alexander, and Hannah entered the waiting_room. We don't know their thoughts. +12. Alexander, Avery, William, and Hannah entered the garage. +13. Alexander moved the plum from the red_drawer to the green_cupboard. We don't know his thoughts. +14. Avery moved the plum from the green_cupboard to the blue_treasure_chest. We don't know her thoughts. +15. 
William moved the plum from the blue_treasure_chest to the green_bottle. We don't know his thoughts. +16. Hannah moved the plum from the green_bottle to the blue_bathtub. We don't know her thoughts. +17. Alexander, Avery, William, and Hannah entered the waiting_room. We don't know their thoughts. + +Based on the assumptions given, Avery can only infer William's thoughts if she has been in the same place as him or has had private or public interactions with him. We know that Avery and William were both in the garage, so Avery could have inferred William's thoughts about the persimmon. + +Since the persimmon is currently in the red_basket, we need to find out where William thinks the persimmon is. We know that Hannah moved the persimmon from the red_basket to the blue_crate, but we don't know if William is aware of this. We also don't know if William saw Carter move the persimmon to the green_basket. + +However, we do know that William moved the plum from the blue_treasure_chest to the green_bottle, which means he was aware of the location of the plum. Therefore, it's possible that he also knew the location of the persimmon. + +Based on this information, we can eliminate options A, D, F, and G, as there is no evidence that William thinks the persimmon is in any of these locations. We can also eliminate options C, E, H, and I, as there is no evidence that Hannah thinks the persimmon is in any of these locations. + +That leaves us with options B, J, K, L, M, and N. Since we don't have any direct evidence of William's thoughts about the persimmon, we need to look for clues in the movements of the agents. + +We know that Hannah moved the persimmon from the red_basket to the blue_crate, but we don't know if she told anyone about this. We also know that Carter moved the persimmon from the blue_crate to the green_basket, but we don't know if he told anyone about this either. 
+ +However, we do know that Avery moved the plum from the green_cupboard to the blue_treasure_chest, which means she was aware of the location of the plum. Therefore, it's possible that she also knew the location of the persimmon. + +Based on this information, we can eliminate options K, L, and N, as there is no evidence that Avery thinks the persimmon is in any of these locations. We can also eliminate option M, as there is no evidence that Hannah thinks the persimmon is in the blue_bathtub. + +That leaves us with options B and J. Since Avery moved the plum from the green_cupboard to the blue_treasure_chest, it's possible that she thinks the persimmon is also in a blue container. Therefore, the most likely answer is J. Avery thinks Hannah thinks William thinks the persimmon is in the green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1445a301e1f22918aca8e86da8c5de6139fb93b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1,65 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. 
+14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Alexander think Avery thinks Hannah thinks William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_crate +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. To start, we need to identify the agents involved in the question: Alexander, Avery, Hannah, and William. We also need to focus on the persimmon, which is the subject of the question. + +Step by step, we can determine the following: + +1. Hannah moved the persimmon to the blue_crate. +2. Hannah exited the bedroom. +3. Alexander made no movements and stayed in the bedroom for 1 minute. +4. Alexander exited the bedroom. +5. Carter moved the persimmon to the green_basket. +6. Avery made no movements and stayed in the bedroom for 1 minute. +7. William moved the persimmon to the red_basket. +8. Alexander, Avery, William, and Hannah entered the waiting_room. + +Based on these steps, we know that Alexander was in the bedroom with Hannah and Avery before the persimmon was moved. However, he did not make any movements and stayed in the bedroom for 1 minute before exiting. This means that he did not witness the persimmon being moved to the blue_crate by Hannah. + +Avery also did not move the persimmon and stayed in the bedroom for 1 minute before exiting. This means that she did not witness the persimmon being moved to the green_basket by Carter or to the red_basket by William. + +Hannah moved the persimmon to the blue_crate before exiting the bedroom. William moved the persimmon to the red_basket after Hannah left the bedroom. Therefore, Avery could have seen the persimmon in either the blue_crate or the red_basket, depending on when she exited the bedroom. + +However, we need to determine where Alexander thinks Avery thinks Hannah thinks William thinks the persimmon is. Since Alexander did not witness the persimmon being moved, he can only rely on what he heard from the other agents. + +Assuming that Avery trusts William more than Hannah (since William exited the bedroom after Hannah), she would believe that the persimmon is in the red_basket. 
However, since Alexander did not witness the persimmon being moved, he cannot be sure where it is. Therefore, he would likely think that Avery thinks Hannah thinks William thinks the persimmon is in the red_basket. + +The answer is A. red_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea217f377da67bc004bbe8537a057f1ad305c919 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. 
+28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the eggplant throughout the story. According to the story, the eggplant was initially in the green_pantry (as stated in sentence 2). Emily then moved the eggplant to the blue_drawer (sentence 3), and later Emma moved it to the green_box (sentence 7). When Emily, Avery, Jack, and Emma re-entered the garage (sentence 23), the eggplant was in the green_box (sentence 15). Emily then moved the eggplant to the green_bottle (sentence 18), and Jack moved it to the green_pantry (sentence 20). Therefore, the correct answer is G. green_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..79aff7955276e6ecdb24b7bdb90d4679c9200341 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. 
+35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emma really think the eggplant is? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the eggplant and where it ends up. According to the story, the eggplant starts in the green_pantry, is moved to the blue_drawer by Emily, then to the green_box by Emma, and finally to the green_bottle by Emily. Therefore, the correct answer is J. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec5dc90b450dd0c204d470b150afb7ee6e5dfcca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. 
+2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To answer this question, we need to track the movements of Emma and the eggplant. According to the story, Emma moved the eggplant from the blue_drawer to the green_box, and then later moved it again to the green_bottle. Jackson was in the garage when Emma moved the eggplant to the green_box, but he made no movements and stayed in the garage for 1 minute before exiting. Therefore, he did not witness Emma moving the eggplant to the green_bottle. + +Based on assumption (2), Jackson can only infer Emma's thought about the eggplant if they had been in the same place or had private or public interactions. According to the story, Jackson and Emma did not have any private interactions, and there is no mention of any public interactions between them. Therefore, Jackson cannot accurately infer where Emma thinks the eggplant is. + +Since we cannot determine where Emma thinks the eggplant is, we cannot determine where Jackson thinks Emma thinks the eggplant is. The answer is not provided in the multiple-choice options. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0bc36a177a0c71cf22ded694b2dcaab79dae755d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. 
+35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jack think Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To answer this question, we need to trace the movements of Jack, Jackson, and Emma regarding the eggplant. + +- Jack entered the garage with Emily, Avery, Emma, and Jackson. +- Jack made no movements and stayed in the garage for 1 minute before exiting. +- Jackson made no movements and stayed in the garage for 1 minute before exiting. +- Emma moved the eggplant to the green_box while Jack was still in the garage. +- Later, Emma, Emily, and Jack entered the garage again. +- The eggplant was in the green_box at this point. +- Emma made no movements and stayed in the garage for 1 minute before exiting. +- Emily moved the eggplant to the green_bottle before exiting. +- Jack moved the eggplant to the green_pantry before exiting. + +Based on these movements, we can conclude that Jack knows the eggplant was in the green_pantry when he left the garage for the second time. 
However, we don't have any information about where Jackson thinks the eggplant is. + +Since Jackson made no movements regarding the eggplant and didn't witness any of the movements made by Emma, Emily, or Jack, he has no way of knowing where the eggplant is. Therefore, we cannot determine where Jack thinks Jackson thinks Emma thinks the eggplant is. + +The answer is: Cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ac4de22753d902e67c1573bff0dd8cc1dcb04ca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. 
+24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emily think Jack thinks Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Emily moved the eggplant to the blue_drawer. +2. Emma moved the eggplant to the green_box. +3. Jack moved the eggplant to the green_pantry. +4. The eggplant is in the green_box. + +Based on these movements, we can infer that Emily thinks that Jack thinks that the eggplant is in the green_box. + +5. Emily moved the cherry to the green_bottle. +6. Avery moved the cherry to the green_pantry. +7. 
Jack moved the cherry to the blue_cupboard. + +Based on these movements, we can infer that Jack likes the green_envelope, but we don't have any information about what Emily thinks about Jack's preference. + +8. Therefore, we cannot determine where Emily thinks Jack thinks Jackson thinks Emma thinks the eggplant is. + +None of the answer choices match the location of the eggplant that Emily thinks Jack thinks Jackson thinks Emma thinks it is in. Therefore, the answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ec0e01191618c9561aad4111d82d6ee5b5da2f8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. 
+21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where is the lime really? +Answer: blue_crate +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to track the movements of the lime and the agents who interacted with it. According to the story, the lime was initially in the blue_crate (statement 3). 
Elizabeth moved it to the green_pantry (statement 4), and then Nathan moved it to the green_basket (statement 9). Owen then moved it to the red_box (statement 11), and finally, Jackson moved it back to the blue_crate (statement 13). Therefore, the lime is really in the blue_crate (option L). The other options are not supported by the story. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b015ea38cc519dc6d90e9be3dc11ee30350d94e2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. 
+24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Elizabeth really think the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the lime and Elizabeth. According to the story, the lime was initially in the blue_crate, but Elizabeth moved it to the green_pantry. Therefore, Elizabeth knows that the lime is not in the blue_crate anymore. Later, Nathan moved the lime to the green_basket, and Owen moved it to the red_box. 
However, we don't have any information about Elizabeth's knowledge of these movements. + +Therefore, the only possible answer is N. green_pantry, as that is the last place Elizabeth knew the lime to be. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..429b13ff6a32aec9e9f7924846a1d8d5e5f95b16 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. 
+27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Alexander think Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of Elizabeth and the lime. According to the story, Elizabeth moved the lime from the blue_crate to the green_pantry before exiting the cellar. Later, Owen moved the lime to the red_box, and then Jackson moved it back to the blue_crate. Alexander then moved the plum to the red_drawer before exiting the workshop. 
+ +Based on these movements, we can infer that Alexander thinks Elizabeth thinks the lime is in the green_pantry, since that was the last place Elizabeth was seen with the lime before it was moved by Owen and Jackson. Therefore, the answer is N. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f6ef3082fc20f8c4b4739efd9e3d57952286f81c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. 
+26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Owen think Alexander thinks Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Here are the steps to solve the question: + +1. Identify the agents involved: Owen, Alexander, and Elizabeth. +2. Determine the order of their exits from the workshop: Elizabeth, Alexander, Nathan. +3. Focus on the movements of the lime and the plum, as they are the key items in the question. +4. 
Trace the movements of the lime: it starts in the blue_crate, is moved by Elizabeth to the green_pantry, then by Nathan to the green_basket, then by Owen to the red_box, and finally by Jackson back to the blue_crate. +5. Trace the movements of the plum: it starts in the green_box, is moved by Alexander to the red_drawer, then by Nathan to the green_cupboard. +6. Determine which locations Owen, Alexander, and Elizabeth have been in together, or have had private or public interactions. +7. Based on the assumptions, Owen can infer Alexander's thought about the location of the lime only if they have been in the same place, or have had private or public interactions. +8. From the story, we know that Owen and Alexander have been in the workshop together, and that Elizabeth has also been in the workshop, but has exited before Alexander. +9. Therefore, Owen can infer Alexander's thought about the location of the lime based on what he knows about Alexander's movements in the workshop. +10. Alexander moved the plum to the red_drawer, which is not the same location as the lime. +11. Therefore, Owen cannot infer Alexander's thought about the location of the lime based on his movements in the workshop. +12. The correct answer is therefore impossible to determine based on the given information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..78a5af98a899d4f06992030d19876651d4c4e5e8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1,72 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. 
+4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Nathan think Owen thinks Alexander thinks Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to trace the movements of the lime and the agents' interactions. + +- The lime starts in the blue_crate (step 3). +- Elizabeth moves the lime to the green_pantry (step 4). +- Nathan moves the lime to the green_basket (step 9). +- Owen moves the lime to the red_box (step 11). +- Jackson moves the lime back to the blue_crate (step 13). + +Based on the assumption that agents tend to lie, we cannot trust any agent's claim about where they think the lime is. However, we can use the exit order to infer who might have interacted with whom and potentially shared information. + +- Elizabeth exits the cellar first (step 5). +- Alexander exits the cellar next (step 8). +- Nathan exits the cellar after moving the lime (step 10). +- Owen exits the cellar after moving the lime (step 12). +- Jackson exits the cellar last (step 14). + +We know that Nathan moved the lime to the green_basket before exiting the cellar, so he knows that the lime is not in the blue_crate anymore. However, he has no information about where the lime is after he exits the cellar. + +Owen moved the lime to the red_box after Nathan, so he knows that the lime is not in the green_basket anymore. However, he has no information about where the lime is after he exits the cellar. + +Alexander did not move the lime, but he exited the cellar after Elizabeth and before Nathan and Owen. 
He might have overheard Elizabeth's conversation with Jackson about the lime's location, but we cannot be sure. + +Elizabeth moved the lime from the blue_crate to the green_pantry before exiting the cellar. She might have shared this information with Alexander, but we cannot be sure. + +Jackson lost his watch in the cellar and likes the blue_suitcase in the workshop, but he has no information about the lime's location. + +Based on this analysis, we cannot confidently determine where Nathan thinks Owen thinks Alexander thinks Elizabeth thinks the lime is. The question is asking for a chain of thoughts that involves multiple agents and their assumptions, but we do not have enough information to trace this chain. The correct answer is therefore unknown and cannot be determined from the given story and assumptions. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a01ef8e12388435750ccab5d6b6388fca8f2dc14 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. 
+16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where is the pear really? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of the pear and the agents who interacted with it. According to the story, the pear was initially in the blue_crate (statement 2). Jack moved the pear to the blue_drawer (statement 6), then William moved it to the green_crate (statement 9), and finally Aiden moved it back to the blue_crate (statement 14). Therefore, the pear is in the blue_crate (option L). The correct answer is L. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a9fa26650766506e297c744544533291237b6211 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. 
+23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Noah really think the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: Step 1: Look for any information related to Noah's movements or actions regarding the pear. + +Step 2: Trace the movements of the pear and see if Noah was present in any of those places. + +Step 3: Use the assumption that agents tend to lie and that their claims don't reflect their actual thoughts. 
+ +Step 4: Use the assumption that agents tend to trust those who exited the room later than themselves. + +Based on the story and assumptions, we can see that Noah moved the pear to the blue_suitcase and then exited the playroom. Later, William moved the pear to the green_crate and then exited the playroom. Finally, Aiden moved the pear to the blue_crate and then exited the playroom. Noah was not present in any of these movements, so we cannot trust his claims about the pear's location. However, we do know that William exited the playroom after Noah, so if Noah were to trust anyone, it would be William. Therefore, we can conclude that Noah really thinks the pear is in the green_crate, which is where William moved it. The answer is B. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..57207aebbdca4e1dfa946d12dd1b0f7642a38eba --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. 
+17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does William think Noah thinks the pear is? +Answer: green_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to track the movements of William and Noah with respect to the pear. According to the story, William moved the pear to the green_crate and then exited the playroom. Noah then moved the pear to the blue_suitcase before exiting the playroom. William did not re-enter the playroom after Noah's exit. Therefore, William would not have any information about Noah's movements after he left the playroom. + +Since William did not witness Noah moving the pear to the blue_suitcase, he would not have any reason to think that Noah thinks the pear is in the blue_suitcase. Therefore, the answer is not K. + +William moved the pear to the green_crate, so he knows that the pear is not in the blue_crate (M) or the blue_drawer (N). He also did not witness anyone else moving the pear to the blue_pantry (C) or the green_drawer (B). Therefore, he would not have any reason to think that Noah thinks the pear is in any of these locations. + +The remaining options are red_pantry (A), blue_bucket (D), green_box (E), green_bathtub (F), red_bottle (G), red_crate (H), red_envelope (I), blue_cupboard (J), and green_basket (O). There is no information in the story to suggest that the pear is in any of these locations, so we cannot determine where William thinks Noah thinks the pear is. + +Therefore, the answer is none of the above. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f9c9a0037bd87d00d629fb468f0cf9b51b5098e7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Isabella think William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of Isabella, William, and Noah with respect to the pear. Isabella entered the playroom with the group, made no movements, and exited the playroom. William moved the pear to the green_crate and then exited the playroom. Noah moved the pear to the blue_suitcase and then exited the playroom. + +Isabella did not witness William moving the pear to the green_crate, but she did witness Noah moving the pear to the blue_suitcase. Therefore, Isabella knows that the pear is currently in the blue_suitcase. + +We don't know where William thinks the pear is, but we do know that he dislikes peas (not relevant to the question). We also don't know where Noah thinks the pear is, but we do know that he lost his phone (also not relevant to the question). + +So, the answer to the question is: Isabella thinks that William thinks that Noah thinks the pear is in the blue_suitcase. Therefore, the answer is K. blue_suitcase. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1c62ea955314a0607c6c27f4dbc9229f4d2029e1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. 
+34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Aiden think Isabella thinks William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: First, we need to determine the order of exits from the playroom. Isabella exited first, followed by Jack, then William, then Noah, and finally Aiden. + +Next, we need to track the movements of the pear. It started in the blue_crate, was moved to the blue_drawer by Jack, then to the green_crate by William, and finally to the blue_suitcase by Noah. + +Based on the assumption that agents tend to trust those who exited the room later than themselves, Aiden would trust Noah's judgment the most since he was the last to exit the playroom. + +Noah moved the pear to the blue_suitcase, so Aiden thinks that Noah thinks the pear is in the blue_suitcase. + +Isabella made no movements or interactions related to the pear, so her thoughts on the pear's location are irrelevant to the question. 
+ +William moved the pear to the green_crate, but Aiden would not trust his judgment as much as Noah's since William exited the playroom before Noah. + +Therefore, the answer is C. blue_pantry, which was not one of the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d4f878b76878b51a2fc6f56f64bb119cc6fa2ec --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1,67 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. 
+28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where is the onion really? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: Step 1: Look for any statements related to the location of the onion. +- Statement 2: The onion is in the blue_treasure_chest. +- Statement 5: Charlotte moved the onion to the green_treasure_chest. +- Statement 7: Owen moved the onion to the red_drawer. +- Statement 28: The onion is in the red_drawer. + +Step 2: Determine which statement is true based on the given assumptions. +- Since the agents tend to lie, we cannot trust their statements at face value. 
+- However, we can use the exit order to determine who might be more trustworthy. +- According to assumption 4, an agent tends to trust another agent who exited the room later than himself. +- Based on statement 2, Emily, Charlotte, Owen, Nathan, and Liam were all in the attic when the onion was first introduced. +- Emily made no movements and stayed in the attic for 1 minute before exiting. +- Charlotte moved the onion to the green_treasure_chest and then exited. +- Owen moved the onion to the red_drawer and then exited. +- Nathan made no movements and stayed in the attic for 1 minute before exiting. +- Liam made no movements and stayed in the attic for 1 minute before exiting. +- Based on assumption 1, we can assume that the agent who exited the attic last witnessed all the movements related to the onion. +- According to statement 28, the onion is in the red_drawer. +- Therefore, the answer is N. red_drawer. + +a: 5 1 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1953c8a5b033e59081200eb13b39c9563f6f861a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. 
+11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Nathan really think the onion is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the onion and the agents' thoughts. According to the story, Emily, Charlotte, Owen, Nathan, and Liam entered the attic together. The onion was initially in the blue_treasure_chest, but it was later moved to the green_treasure_chest by Charlotte, and then to the red_drawer by Owen. Nathan made no movements while in the attic, but he lost his gloves there. + +Later, Charlotte, Owen, Liam, and Nathan entered the attic together again. The onion was in the red_drawer, but Owen moved it to the blue_bottle before they all exited the attic. + +Based on the assumptions given, we know that Nathan's actual thought may not match what he tells others, and that he may trust the thoughts of agents who exited the room later than him. + +Since Nathan made no movements with the onion while in the attic, we can assume that he did not know where the onion was moved to. However, since Owen moved the onion to the blue_bottle after Nathan left the attic, Nathan may trust Owen's thought that the onion is in the blue_bottle. Therefore, the answer is O. blue_bottle. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..476564a9aa29e98340a765ab545837fa6ccec04a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. 
green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the onion and the agents' exits from the attic. According to the story, Emily was the first to enter the attic and made no movements before exiting. Charlotte moved the onion from the blue_treasure_chest to the green_treasure_chest before exiting. Owen then moved the onion to the red_drawer before exiting. Nathan made no movements before exiting, and Liam made no movements before exiting. + +Later, Emily moved the lemon from the red_bottle to the blue_container before exiting the front yard. Charlotte then moved the lemon to the blue_crate before exiting the front yard, and Liam moved the lemon to the green_drawer before exiting the front yard. + +After some time, Charlotte, Owen, Liam, and Nathan entered the attic together. Charlotte made no movements before exiting, and Owen moved the onion to the blue_bottle before exiting. Liam made no movements before exiting, and Nathan made no movements before exiting. + +Based on the assumption that agents tend to trust those who exited the room later than themselves, we can assume that Emily trusts Nathan more than Charlotte or Owen. 
Since Emily did not move the onion and Nathan made no movements in the attic, Emily would likely think that Nathan still believes the onion is in the last place it was moved to, which is the red_drawer. Therefore, the answer is N. red_drawer. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b57d067ec267cdbde5479ad5f22517217f306420 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. 
+27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Owen think Emily thinks Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their thoughts about the onion's location. + +First, Emily, Charlotte, Owen, Nathan, and Liam entered the attic. Emily made no movements and stayed in the attic for 1 minute before exiting. Then, Charlotte moved the onion from the blue_treasure_chest to the green_treasure_chest and exited the attic. 
Owen moved the onion from the green_treasure_chest to the red_drawer and exited the attic. Nathan made no movements and stayed in the attic for 1 minute before exiting. Liam made no movements and stayed in the attic for 1 minute before exiting. + +Later, Charlotte, Owen, Liam, and Nathan entered the attic again. The onion was in the red_drawer. Charlotte made no movements and stayed in the attic for 1 minute before exiting. Owen moved the onion from the red_drawer to the blue_bottle and exited the attic. Liam made no movements and stayed in the attic for 1 minute before exiting. + +Based on the assumptions given, we know that Owen can only infer Nathan's thoughts if they were in the same place or had private or public interactions. Nathan made no movements in the attic, so he did not interact with Owen. Therefore, Owen cannot infer Nathan's thoughts about the onion's location. + +However, Owen can infer Emily's thoughts about Nathan's thoughts. Emily was in the attic before Charlotte moved the onion to the green_treasure_chest. Therefore, Emily would have thought the onion was in the blue_treasure_chest. After Emily left the attic, Charlotte moved the onion to the green_treasure_chest, and Owen moved it to the red_drawer. + +So, Owen would think that Emily thinks Nathan thinks the onion is in the blue_treasure_chest. Therefore, the answer is K. blue_treasure_chest. + +a: 5 6 7 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..15753739b296b37c421821d707f6d1df5cce3e85 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Owen thinks Emily thinks Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. 
blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Liam thinks: We need to start with Liam's perspective. According to the story, Liam saw a dog after exiting the attic, but there is no information about what he thinks about the onion's location. Therefore, we don't have any clues about Liam's thoughts on this matter. + +2. Owen thinks: Owen moved the onion from the red_drawer to the blue_bottle in the attic. Therefore, he knows that the onion is not in the red_drawer anymore. However, he doesn't know that Charlotte moved the onion to the green_treasure_chest before he entered the waiting_room. Therefore, he might think that the onion is still in the red_drawer. + +3. Emily thinks: Emily made no movements in the attic and didn't interact with the onion. Therefore, she doesn't have any information about the onion's location. + +4. Nathan thinks: Nathan made no movements in the attic and didn't interact with the onion. Therefore, he doesn't have any information about the onion's location. + +5. Putting it all together: Liam thinks that Owen thinks that the onion is in the blue_bottle (since Owen moved it there). 
However, Owen might actually think that the onion is still in the red_drawer (since he didn't witness Charlotte moving it to the green_treasure_chest). Emily and Nathan don't have any thoughts about the onion's location. + +Therefore, the answer is O. blue_bottle. + +a: 2 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..97a535ad4b9f12b7800425c6cc592e3efbe0fabc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. 
+26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where is the spinach really? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track the movements of the agents and where they placed the spinach. According to the story, the spinach was initially in the green_drawer when all five agents entered the living_room. Elizabeth moved the spinach to the green_pantry, then Evelyn moved it to the red_container. 
Noah moved it back to the green_drawer, and finally, Elizabeth moved it to the blue_treasure_chest. Therefore, the correct answer is option K. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..89b1a5bf847740ffa827496b833814dcf3907db2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. 
+28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Evelyn really think the spinach is? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: Step 1: Look for any information related to Evelyn's movements or actions regarding the spinach. + +Step 2: Trace Evelyn's movements and interactions with other agents to determine if she had any private or public interactions related to the spinach. + +Step 3: Use the assumption that agents tend to lie and that their claims do not reflect their actual thoughts to eliminate any options that may be false. 
+ +Step 4: Use the assumption that agents tend to trust those who exited the room later than themselves to determine if any of the remaining options are more likely to be true. + +Based on the story and assumptions, we can determine that Evelyn moved the spinach to the red_container, but she may not actually think that is where it is. Therefore, we need to look for any private or public interactions that may reveal her true thoughts. + +There are no private interactions related to the spinach, but we do know that Evelyn lost her phone and saw a cat. These events are not related to the spinach, so we can eliminate any options that may be related to them. + +There are also no public interactions related to the spinach, so we cannot use this information to determine Evelyn's true thoughts. + +Therefore, we cannot determine where Evelyn really thinks the spinach is based on the given information. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b3a299bd94f93af988a1d07be11b18cf775d3352 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1,79 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. 
+11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Jackson think Evelyn thinks the spinach is? +Answer: green_cupboard +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: Step 1: Identify the relevant information in the story. +- Jackson, Elizabeth, Evelyn, Liam, and Noah entered the living room. +- The spinach was initially in the green drawer. +- Jackson made no movements and stayed in the living room for 1 minute before exiting. +- Elizabeth moved the spinach to the green pantry and then exited. +- Evelyn moved the spinach to the red container and then lost his phone before exiting. +- Liam made no movements and stayed in the living room for 1 minute before exiting. +- Noah moved the spinach back to the green drawer before exiting. +- Elizabeth lost her watch. +- Jackson, Elizabeth, Evelyn, Liam, and Noah entered the waiting room. +- Liam, Jackson, and Evelyn entered the dining room. +- The sweet potato was initially in the red crate. +- Liam moved the sweet potato to the blue bucket. +- Evelyn saw a cat. +- Jackson moved the sweet potato to the blue container before exiting. +- Liam, Jackson, and Evelyn entered the waiting room. +- Liam, Jackson, Elizabeth, and Evelyn entered the living room. +- The spinach was in the green drawer. +- Liam made no movements and stayed in the living room for 1 minute before exiting. +- Jackson moved the spinach to the green cupboard and likes the blue bathtub before exiting. +- Elizabeth moved the spinach to the blue treasure chest before exiting. +- Evelyn made no movements and stayed in the living room for 1 minute before exiting and likes the green pantry. +- Liam, Jackson, Elizabeth, and Evelyn entered the waiting room. + +Step 2: Determine the thought process of each character regarding the location of the spinach. 
+- Jackson: Initially, the spinach was in the green drawer. After he left the living room, Elizabeth moved it to the green pantry, then Evelyn moved it to the red container, and finally, Noah moved it back to the green drawer. When Jackson returned to the living room, the spinach was in the green drawer again. Later, he moved it to the green cupboard. +- Elizabeth: Initially, the spinach was in the green drawer. She moved it to the green pantry before leaving the living room. She did not return to the living room before the end of the story. +- Evelyn: Initially, the spinach was in the green drawer. He moved it to the red container before losing his phone and leaving the living room. He did not return to the living room before the end of the story. +- Liam: Initially, the spinach was in the green drawer. He made no movements and stayed in the living room for 1 minute before leaving. Later, he moved the sweet potato from the red crate to the blue bucket in the dining room. When he returned to the living room, he made no movements and stayed for 1 minute before leaving again. +- Noah: Initially, the spinach was in the green drawer. He moved it back to the green drawer before leaving the living room. He did not return to the living room before the end of the story. + +Step 3: Determine where Jackson thinks Evelyn thinks the spinach is. +- Jackson and Evelyn were both in the living room when the spinach was moved from the green drawer to the red container. However, Jackson left the living room before Evelyn moved the spinach to the red container. Therefore, Jackson would trust Evelyn's claim about the location of the spinach only if Evelyn exited the living room after him. According to the story, Evelyn exited the living room before Liam, Jackson, and Noah entered the waiting room. Therefore, Jackson would not trust Evelyn's claim about the location of the spinach. 
Instead, he would likely assume that Evelyn still thinks the spinach is in the red container, where he left it before losing his phone. Therefore, the answer is N. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb1230f6ed15d0ff011ff48147fd479dc227ba0f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. 
+27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Liam think Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track the movements and thoughts of Liam, Jackson, and Evelyn regarding the spinach. + +1. All five agents entered the living room where the spinach was located in the green drawer. +2. Jackson made no movements and stayed in the living room for 1 minute before exiting. +3. Elizabeth moved the spinach to the green pantry and then exited. +4. 
Evelyn moved the spinach to the red container and then exited, but lost his phone. +5. Liam made no movements and stayed in the living room for 1 minute before exiting. +6. Noah moved the spinach back to the green drawer and then exited. +7. Elizabeth lost her watch. +8. Liam, Jackson, Evelyn, and Elizabeth entered the living room again where the spinach was still in the green drawer. +9. Liam made no movements and stayed in the living room for 1 minute before exiting. +10. Jackson moved the spinach to the green cupboard and likes the blue bathtub before exiting. +11. Elizabeth moved the spinach to the blue treasure chest before exiting. +12. Evelyn made no movements and stayed in the living room for 1 minute before exiting. +13. Liam, Jackson, Evelyn, and Elizabeth entered the waiting room. + +Based on these movements, we can determine that Liam thinks Jackson thinks Evelyn thinks the spinach is in the green pantry (M). This is because Jackson moved the spinach to the green cupboard (not the green pantry) and Liam was not present to witness this movement. However, Liam knows that Jackson exited the living room after him and therefore trusts his judgment more than Evelyn's. Evelyn moved the spinach to the red container and then lost his phone, which may make Liam doubt his reliability. Therefore, Liam is more likely to trust Jackson's thoughts on the location of the spinach. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f9949c50dd8afc48d0097004a7326e2b4cb6280 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Elizabeth think Liam thinks Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. 
green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions given. We need to track the movements of each character and their interactions to determine where Elizabeth thinks Liam thinks Jackson thinks Evelyn thinks the spinach is. + +First, we know that the spinach was initially in the green_drawer when all five characters entered the living_room. Jackson made no movements and stayed in the living_room for 1 minute before exiting. Elizabeth moved the spinach to the green_pantry before exiting. Evelyn then moved the spinach to the red_container before losing his phone and exiting. Liam made no movements and stayed in the living_room for 1 minute before exiting. Finally, Noah moved the spinach back to the green_drawer before exiting. + +Later on, Liam, Jackson, Elizabeth, and Evelyn entered the living_room again and the spinach was still in the green_drawer. Jackson moved the spinach to the green_cupboard before exiting and Elizabeth moved it to the blue_treasure_chest before exiting. Evelyn made no movements and stayed in the living_room for 1 minute before exiting. 
+ +Based on these movements, we can determine that Elizabeth thinks Liam thinks Jackson thinks the spinach is in the blue_treasure_chest. This is because Elizabeth was the last one to move the spinach before Liam entered the living_room and Liam made no movements before exiting. Jackson moved the spinach to the green_cupboard after Liam left, so Liam would not have seen the spinach in the green_cupboard. Therefore, Elizabeth would assume that Liam thinks the spinach is still in the blue_treasure_chest where she left it. + +Therefore, the answer is K. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4883862ec1bacf967f58c8dcbc9387df0314e3e1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. 
+20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where is the peas really? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the location of the peas. Mila initially moved the peas from the green_treasure_chest to the blue_bucket. Then, Carter moved the peas from the blue_bucket to the green_bucket. 
Finally, Amelia moved the peas from the green_bucket to the blue_cupboard. Therefore, the correct answer is E. blue_cupboard. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc1db1a7763fd982710a207e3d20011d860785ef --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. 
+29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Isla really think the peas is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to look at the movements of each agent and their possible interactions. Mila moved the peas from the green_treasure_chest to the blue_bucket, and Amelia moved them from the blue_bucket to the blue_cupboard. Carter moved the watermelon from the blue_bucket to the green_bucket. Isla made no movements in the staircase, but she was in the same room as Carter who moved the peas to the green_bucket. Emma made no movements in the study, so she has no information about the location of the peas. + +Based on the assumption that agents tend to lie, we cannot trust what Isla says about the location of the peas. 
However, we can infer her actual thought based on her interactions with other agents. Isla was in the same room as Carter who moved the peas to the green_bucket, and she made no movements to suggest that she moved the peas elsewhere. Therefore, Isla really thinks that the peas are in the green_bucket. + +The answer is C. green_bucket. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5cd9fcdb441b525c10615e674e1ebf670287251 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. 
+24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Amelia think Isla thinks the peas is? +Answer: green_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: Step 1: Identify the agents involved in the movement of the peas - Mila, Carter, Isla, and Amelia. + +Step 2: Identify the movements of the peas - Mila moved the peas to the blue_bucket, and then Amelia moved the peas to the blue_cupboard. + +Step 3: Identify the movements of Isla - Isla made no movements in the first staircase, and then Isla moved the lemon to the green_cupboard in the study. 
+ +Step 4: Identify the interactions between Amelia and Isla - There is no mention of any private or public interactions between Amelia and Isla. + +Step 5: Use the assumptions to determine where Amelia thinks Isla thinks the peas is - Since there is no interaction between Amelia and Isla, Amelia cannot infer Isla's thoughts. Therefore, the answer is impossible to determine based on the given information. + +Answer: Cannot be determined. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..509e3afd76eb2da7632d7766fcb59b1dca619eaf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. 
+22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Carter think Amelia thinks Isla thinks the peas is? +Answer: green_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to trace the movements of the characters and their interactions. Mila moved the peas from the green_treasure_chest to the blue_bucket, and then Amelia moved the peas from the blue_bucket to the blue_cupboard. Carter moved the watermelon from the blue_bucket to the green_bucket. 
Isla made no movements related to the peas. Emma made no movements related to the peas. + +Since Amelia moved the peas to the blue_cupboard, it is likely that she thinks the peas are in the blue_cupboard. However, we need to determine what Carter thinks Amelia thinks Isla thinks. + +Carter and Amelia were both in the study together, but there is no indication that they had any private or public interactions related to the peas. Therefore, Carter cannot infer what Amelia thinks about the location of the peas based on their time in the study together. + +The only other time that Carter and Amelia were in the same room together was when they entered the waiting_room with Mila, Isla, and Emma. However, there is no indication that they had any private or public interactions related to the peas during this time. + +Therefore, we cannot determine where Carter thinks Amelia thinks Isla thinks the peas is. The answer is unknown. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a28b1521d2ef0516166bce1efc3a2cc0cd6de05 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. 
+12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Mila think Carter thinks Amelia thinks Isla thinks the peas is? +Answer: blue_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the peas and the agents' thoughts. Mila moved the peas from the green_treasure_chest to the blue_bucket, and Amelia moved them from the blue_bucket to the blue_cupboard. Carter moved the watermelon from the blue_bucket to the green_bucket. Isla made no movements related to the peas or watermelon. Emma made no movements related to the peas or watermelon. + +Since Mila moved the peas to the blue_bucket, we know that Mila thinks the peas are in the blue_bucket. However, we need to determine where Carter thinks Amelia thinks Isla thinks the peas are. + +We know that Amelia moved the peas to the blue_cupboard, but we don't know if Carter is aware of this. Isla made no movements related to the peas, so we can't infer her thoughts on their location. Therefore, we need to determine if Carter thinks the peas are still in the green_bucket or if he thinks they were moved to the blue_cupboard. + +Since Carter exited the staircase after Mila, Mila may trust his thoughts more than Isla's or Emma's. However, we don't have any information about private or public interactions between Mila and Carter that would allow Mila to infer Carter's thoughts. + +Therefore, we cannot determine where Mila thinks Carter thinks Amelia thinks Isla thinks the peas are. The answer is unknown. 
+ +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..56476f4f8fdd6264df2dceef59c08f0812246581 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. 
+29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where is the green_pepper really? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the location of the green pepper. According to the story, the green pepper was initially in the red basket (statement 2), but Jackson moved it to the blue container (statement 3). We don't have any further information about the green pepper's location after that. Therefore, the answer is G. blue_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..51c560a471892f923484202d38dec7afe2d62f85 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. 
+30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Emma really think the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to trace Emma's movements and any interactions she had with other agents regarding the location of the green pepper. According to the story, Emma made no movements in the living room and did not interact with any other agents regarding the green pepper. Therefore, we cannot determine where Emma really thinks the green pepper is based on the given information. The answer is not provided in the options given. The correct answer is "Cannot be determined." 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab6b2bb224e8744321316e9121fba492c8c26868 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. 
+30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Benjamin think Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of Benjamin and Emma and the location of the green pepper. According to the story, Jackson moved the green pepper from the red basket to the blue container while all five agents were in the living room. Benjamin then saw a cat and exited the living room, while Emma stayed in the living room for one minute before exiting. Later, Benjamin, Emma, and Abigail entered the bedroom where they found the grapes in the red bottle. Benjamin then moved the grapes to the green bathtub before exiting the bedroom. 
Emma stayed in the bedroom for one minute before exiting. + +There is no mention of Emma making any movements related to the green pepper, so we cannot determine where she thinks it is. However, we do know that Benjamin did not witness Jackson moving the green pepper to the blue container, so he may not know its current location. We also know that Benjamin moved the grapes to the green bathtub, which is not related to the location of the green pepper. + +Therefore, we cannot determine where Benjamin thinks Emma thinks the green pepper is based on the given information. The answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4badf9858cb83ad4a657f307fc20f7308af7d8a8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. 
+17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Jackson think Benjamin thinks Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to trace the movements of Jackson, Benjamin, and Emma regarding the green pepper. Jackson initially moved the green pepper from the red basket to the blue container in the living room. Benjamin did not make any movements in the living room and only saw a cat. Emma also did not make any movements in the living room and only liked the blue bottle in the waiting room. + +Since Benjamin did not witness Jackson moving the green pepper, he cannot know its current location. However, Emma was in the living room when Jackson moved the green pepper to the blue container. Therefore, Emma knows that the green pepper is in the blue container. + +Now, we need to determine where Jackson thinks Benjamin thinks Emma thinks the green pepper is. Since Benjamin did not witness the movement of the green pepper, he cannot have any thoughts about its current location. However, Emma knows that the green pepper is in the blue container. Therefore, Jackson thinks that Benjamin thinks Emma thinks the green pepper is in the blue container. + +The answer is G. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c7f61e0ed245ed974b5ccc94327ff135a675a72 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. 
+4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Abigail think Jackson thinks Benjamin thinks Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. 
green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Abigail thinks: We need to consider what Abigail knows about the location of the green pepper. According to the story, Jackson moved the green pepper from the red basket to the blue container. Abigail was in the living room when this happened, so she knows that the green pepper is in the blue container. + +2. Jackson thinks: We need to consider what Jackson knows about the location of the green pepper and what he might be thinking. Jackson moved the green pepper to the blue container, so he knows that it is there. However, we don't have any information about what he might be thinking about the green pepper. + +3. Benjamin thinks: We need to consider what Benjamin knows about the location of the green pepper and what he might be thinking. Benjamin saw a cat in the living room, but we don't have any information about what he knows or thinks about the green pepper. + +4. Emma thinks: We need to consider what Emma knows about the location of the green pepper and what she might be thinking. We know that Emma likes the blue bottle, but we don't have any information about what she knows or thinks about the green pepper. + +5. 
Putting it all together: Abigail thinks that Jackson thinks that Benjamin thinks that Emma thinks the green pepper is in the blue container. This is because Abigail knows that the green pepper is in the blue container, and she trusts Jackson's movements because he exited the living room after her. Benjamin and Emma did not move the green pepper, so Abigail cannot infer their thoughts about its location. Therefore, the answer is G. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c8521bee80743e0fb108c69c102148f2d2008e3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. 
+23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where is the peas really? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions with the peas. According to the story, the peas were initially in the green_basket when all five agents entered the patio. Mila and Amelia made no movements and exited the patio after one minute each. 
Jackson also made no movements and exited the patio after one minute, but we know that he likes the green_bathtub, not the green_basket where the peas were located. Hannah moved the peas to the blue_bathtub before exiting the patio. Abigail made no movements and exited the patio after one minute. + +Therefore, based on the story, the peas are in the blue_bathtub. The answer is O. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0abe2947ee0fb67572b5292a9ddbdf7b2f2b4c39 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. 
+25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Hannah really think the peas is? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to look for any information related to where Hannah thinks the peas is. According to the story, Hannah moved the peas to the blue_bathtub, but there is no information about where she thinks the peas is. Therefore, we cannot determine the answer based on the given information. The correct answer is not provided in the options. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..40614b21db6f733d99e883b8fe8533ddb213ae94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. 
+32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Amelia think Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of Amelia and Hannah and the location of the peas. According to the story, Hannah moved the peas to the blue_bathtub, and then later moved the lemon to the red_envelope. Amelia was in the patio and then entered the lounge with Hannah and Mila. She then moved the lemon to the blue_container before exiting the lounge. + +There is no information in the story about Amelia and Hannah having any private or public interactions, so we cannot infer Amelia's thoughts about where Hannah thinks the peas is based on their conversations. 
However, we do know that Amelia exited the lounge before Hannah moved the lemon to the red_envelope, so Hannah would not have been able to tell Amelia where she moved the peas to. + +Therefore, the answer to the question is not provided in the story and cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6258ec69f924840c76406eaa640d6af53d6d0ee3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. 
+27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Jackson think Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To solve this question, we need to trace the movements of Jackson, Amelia, and Hannah and their interactions. + +- Jackson entered the patio and made no movements before exiting. +- Amelia entered the patio and made no movements before exiting. +- Hannah entered the patio and moved the peas to the blue_bathtub before exiting. +- Jackson likes the green_bathtub. +- Hannah, Amelia, and Mila entered the lounge and moved the lemon to different places before exiting. 
+- Mila moved the lemon to the green_box. +- Hannah likes the green_crate. +- Jackson entered the closet and made no movements before exiting. +- Hannah, Abigail, Mila, and Jackson entered the waiting_room. + +Based on these movements, we can infer that Jackson and Amelia did not have any interactions or were not in the same place at the same time. Therefore, Jackson cannot infer what Amelia thinks about the location of the peas. + +Hannah moved the peas to the blue_bathtub, but we don't know what she thinks about the location of the peas. + +Therefore, the answer to the question is not determinable based on the given information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..730d0b457033746b7e7dd0df2aad810b3eae01c6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1,116 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. 
+18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Abigail think Jackson thinks Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. 
Abigail was in the patio with Jackson, Amelia, Mila, and Hannah when they entered. +2. The peas is in the green_basket. +3. Mila made no movements and stayed in the patio for 1 minute. +4. Mila exited the patio. +5. Amelia made no movements and stayed in the patio for 1 minute. +6. Amelia exited the patio. +7. Jackson made no movements and stayed in the patio for 1 minute. +8. Jackson exited the patio. +9. Jackson likes the green_bathtub. +10. Hannah moved the peas to the blue_bathtub. +11. Hannah exited the patio. + +Based on these steps, we know that Abigail was in the same place as Jackson, Amelia, Mila, and Hannah when they entered the patio. We also know that the peas was originally in the green_basket, but Hannah moved it to the blue_bathtub. We don't have any information about what Abigail thinks about the location of the peas at this point. + +To continue, we need to look at the actions of the other agents: + +12. Abigail made no movements and stayed in the patio for 1 minute. +13. Abigail exited the patio. +14. Mila, Amelia, Jackson, Hannah, and Abigail entered the waiting_room. +15. Hannah, Amelia, and Mila entered the lounge. +16. The lemon is in the blue_cupboard. +17. Hannah moved the lemon to the red_envelope. +18. Hannah exited the lounge. +19. Amelia moved the lemon to the blue_container. +20. Amelia exited the lounge. +21. Jackson dislikes the beans. +22. Mila moved the lemon to the green_box. +23. Hannah likes the green_crate. +24. Mila exited the lounge. +25. Hannah, Amelia, and Mila entered the waiting_room. + +At this point, Abigail has not interacted with any of the other agents since leaving the patio. However, we do know that Hannah moved the lemon from the blue_cupboard to the red_envelope, and then Amelia moved it to the blue_container. We also know that Mila moved the lemon to the green_box, and that Hannah likes the green_crate. 
None of this information is directly related to the location of the peas, but it may be useful in making inferences. + +Let's continue: + +26. Hannah, Abigail, Mila, and Jackson entered the closet. +27. The sweet_potato is in the red_bucket. +28. Hannah moved the sweet_potato to the green_cupboard. +29. Hannah exited the closet. +30. Abigail made no movements and stayed in the closet for 1 minute. +31. Abigail exited the closet. +32. Mila made no movements and stayed in the closet for 1 minute. +33. Mila exited the closet. +34. Jackson made no movements and stayed in the closet for 1 minute. +35. Jackson exited the closet. +36. Hannah, Abigail, Mila, and Jackson entered the waiting_room. + +Now we have some new information: the sweet_potato is in the red_bucket, but Hannah moved it to the green_cupboard. We also know that Abigail, Mila, and Jackson were in the closet together, but we don't have any information about what they discussed. + +Based on all of this information, we can make some inferences about what Abigail might think about where Jackson thinks Amelia thinks Hannah thinks the peas is. Here's our reasoning: + +- Abigail was in the same place as Jackson, Amelia, Mila, and Hannah when they entered the patio, but we don't have any information about what they discussed or what Abigail thinks about the location of the peas. +- Hannah moved the lemon from the blue_cupboard to the red_envelope, and then Amelia moved it to the blue_container. Mila then moved it to the green_box. This suggests that the agents are capable of moving objects around and that they may have different opinions about where things should be located. +- Hannah moved the sweet_potato from the red_bucket to the green_cupboard. This suggests that Hannah is willing to move objects around and that she may have a preference for where things should be located. +- Jackson likes the green_bathtub, but we don't have any information about what he thinks about the location of the peas. 
+- Abigail, Mila, and Jackson were in the closet together, but we don't have any information about what they discussed or what Abigail thinks about the location of the peas. + +Based on all of this, we can't say for certain where Abigail thinks Jackson thinks Amelia thinks Hannah thinks the peas is. However, we can make some educated guesses based on the available information. Here are a few possibilities: + +- If Abigail trusts Jackson and believes that he has good taste, she might think that he agrees with her own preference for the green_crate, where Hannah likes to keep things. +- If Abigail thinks that Hannah is the most opinionated about where things should be located, she might assume that Jackson and Amelia defer to her judgment and think that the peas is in the blue_bathtub, where Hannah moved it. +- If Abigail thinks that the other agents are unpredictable and that they all have different opinions about where things should be located, she might not have any idea where Jackson thinks Amelia thinks Hannah thinks the peas is. + +Given these possibilities, we can't definitively answer the question without more information. However, we can eliminate some of the answer choices based on what we know: + +- We know that the peas is not in the blue_pantry, red_bucket, red_drawer, red_pantry, or green_bucket, so we can eliminate those answer choices. +- We know that Jackson likes the green_bathtub, but we don't have any information about what he thinks about the location of the peas, so we can't assume that he thinks it's in the green_basket or the green_crate. +- We know that Hannah moved the peas to the blue_bathtub, but we don't have any information about what Amelia or Jackson think about the location of the peas, so we can't assume that they think it's in the blue_bathtub or any other location. + +Based on this analysis, we can eliminate answer choices A, B, D, G, I, K, L, and O. 
That leaves us with answer choices E, F, H, and M as possibilities, but we can't say for certain which one is correct. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..912bec508abaffdd918b0a0f89f8a3ea271eaeac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. 
+30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where is the turnip really? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the turnip throughout the story. According to the story, the turnip was initially in the red_basket when Hannah, Lily, Logan, Elizabeth, and Noah entered the study. Elizabeth then moved the turnip to the green_pantry, and Noah later moved it to the red_basket again. Hannah then moved the turnip to the blue_pantry before they all left the study. Therefore, the turnip is actually in the blue_pantry. The answer is C. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..56d1d3269d6cc846f96f8c6d753dca3b22424bc0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. 
+33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Hannah really think the turnip is? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the turnip and the agents' interactions with it. According to the story, the turnip was initially in the red_basket when all five agents entered the study. Hannah made no movements and stayed in the study for 1 minute before exiting. After Hannah, Lily and Logan also made no movements and stayed in the study for 1 minute each before exiting. Elizabeth then moved the turnip to the green_pantry before exiting. Finally, Noah moved the turnip back to the red_basket before exiting. + +Hannah was the first agent to enter the study when the turnip was in the red_basket, and she made no movements before exiting. Therefore, she must have thought that the turnip was still in the red_basket. 
Elizabeth moved the turnip to the green_pantry after Hannah left, so Hannah would not have known about this movement. Noah then moved the turnip back to the red_basket after Elizabeth left, so Hannah would still think that the turnip was in the red_basket. + +Therefore, the answer is A. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3ee17bee38d548d6c1260562951814c3c1fa5ee --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. 
+26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Lily think Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of Hannah and the turnip. According to the story, Hannah entered the study, made no movements, and stayed there for 1 minute before exiting. Later, Hannah entered the study again with Noah, Lily, and Elizabeth. While they were in the study, Hannah moved the turnip to the blue_pantry before exiting. 
+ +Since Lily was in the study with Hannah when she moved the turnip, Lily knows that the turnip is not in the red_basket (where it was originally) but in the blue_pantry. Therefore, Lily thinks that Hannah thinks the turnip is in the blue_pantry. + +The answer is C. blue_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..524ade22a88f2ae3ef91002d5dadbc31ec118685 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. 
+26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Noah think Lily thinks Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to trace the movements of the agents and their thoughts about the turnip. According to the story, the turnip was initially in the red_basket in the study (step 2). Elizabeth moved it to the green_pantry (step 10), and then Noah moved it to the blue_pantry (step 32). Lily made no movements in the study (step 5), so we don't know her thoughts about the turnip. 
Hannah made no movements after entering the study for the first time (step 3), but she moved the turnip to the blue_pantry before exiting the study (step 32). + +Noah entered the study with Lily, Hannah, and Elizabeth (step 25) and saw that the turnip was in the red_basket (step 26). He made no movements in the study (step 28) and then exited. Lily also made no movements in the study (step 30) before exiting. + +Based on the assumptions given, we know that Noah can only infer Lily's thoughts if they had private or public interactions in the study. However, there is no mention of any private or public interactions between Noah and Lily in the study. Therefore, we cannot determine where Noah thinks Lily thinks Hannah thinks the turnip is. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75af2757992a9ee97f1e4967b827bf4be3f80bc3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. 
+16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Logan think Noah thinks Lily thinks Hannah thinks the turnip is? +Answer: green_drawer +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_drawer +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Logan exited the study before the turnip was moved to the green_pantry by Elizabeth. +2. Logan lost his watch before entering the waiting_room with Hannah and Noah. +3. Noah moved the sweet_potato to the red_envelope before Logan moved it to the green_drawer. +4. Logan exited the dining_room before Hannah entered it and moved the turnip to the blue_pantry. +5. Noah and Lily were in the study together, but there is no information about their thoughts on the turnip. +6. Hannah was the last one to touch the turnip and moved it to the blue_pantry. + +Based on these steps, we can infer that Logan thinks Noah thinks Lily thinks Hannah thinks the turnip is in the blue_pantry. Therefore, the answer is C. blue_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6192d42eed972d16020ba5c00cd20a81be198fd0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. 
+12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where is the watermelon really? +Answer: red_bottle +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: The watermelon is in which location according to the story and assumptions? +A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Step-by-step solution: +1. According to step 3, the watermelon is in the green_cupboard. +2. According to step 13, Mila moved the watermelon to the green_cupboard. +3. According to step 26, the watermelon is still in the green_cupboard. +4. Therefore, the answer is L. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..09077244a169989b0a937b14f85f9211cec7108a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. 
+14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Evelyn really think the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: First, we need to identify the relevant information in the story. We know that the watermelon is initially in the green_cupboard (statement 3), and then Mila moves it to an unknown location (statement 13). Later, Logan moves the watermelon to the red_bottle (statement 31). Evelyn makes no movements in the staircase where the watermelon is located (statement 27). + +Using assumption 2, we know that Evelyn can only infer the location of the watermelon if she has been in the same place as Mila or Logan, or if they have had private or public interactions. From the story, we know that Evelyn and Mila both entered and exited the staircase before Logan moved the watermelon (statements 1, 13, 15, 26, and 30). Therefore, it is possible that Mila told Evelyn where she moved the watermelon, or that Evelyn saw the watermelon in its new location before Logan moved it. + +Using assumption 3, we know that what Evelyn tells others doesn't necessarily reflect her actual thoughts. Therefore, we cannot rely on any public claims she may have made about the location of the watermelon. + +Using assumption 4, we know that Evelyn may trust Logan's claim about the location of the watermelon since he exited the staircase after her. However, we do not know if Logan made any public claims about the location of the watermelon. + +Therefore, based on the information given, we cannot definitively determine where Evelyn really thinks the watermelon is. The answer is inconclusive. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..78bac867dae19db05be847d479d55299a8cefefa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. 
+29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Logan think Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of Logan and Evelyn and the location of the watermelon. According to the story, Evelyn entered the staircase with Logan, Chloe, Charlotte, and Mila. She made no movements and stayed in the staircase for 1 minute before exiting. Mila moved the watermelon to the green_cupboard before exiting the staircase. Later, Logan entered the staircase with Chloe, Charlotte, and Mila. He made no movements and stayed in the staircase for 1 minute before exiting. He then moved the watermelon to the red_bottle before exiting the staircase. 
Finally, Evelyn entered the waiting_room with Logan, Chloe, Charlotte, and Mila. + +Based on the assumption that agents tend to trust those who exited the room later than themselves, Logan would trust Evelyn's knowledge of the watermelon's location since she exited the staircase before him. Therefore, Logan would think that Evelyn thinks the watermelon is in the green_cupboard, where Mila had placed it before Logan moved it to the red_bottle. The answer is L. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5adaafe48eb03faa76a9e7206715eeefdee9d2cd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1,90 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. 
+20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Chloe think Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: To answer this question, we need to track Chloe's movements and interactions with Logan and Evelyn regarding the location of the watermelon. + +1. 
Chloe entered the staircase with Evelyn, Charlotte, Logan, and Mila. +2. Chloe lost his gloves. +3. The watermelon is in the green_cupboard. +4. Evelyn made no movements and stayed in the staircase for 1 minute. +5. Chloe lost his watch. +6. Evelyn exited the staircase. +7. Chloe made no movements and stayed in the staircase for 1 minute. +8. Chloe exited the staircase. +9. Charlotte made no movements and stayed in the staircase for 1 minute. +10. Charlotte exited the staircase. +11. Logan made no movements and stayed in the staircase for 1 minute. +12. Logan exited the staircase. +13. Mila moved the watermelon to the green_cupboard. +14. Mila exited the staircase. +15. Evelyn, Chloe, Charlotte, Logan, and Mila entered the waiting_room. +16. Charlotte, Logan, and Chloe entered the staircase. +17. The lemon is in the red_pantry. +18. Charlotte made no movements and stayed in the staircase for 1 minute. +19. Charlotte exited the staircase. +20. Logan made no movements and stayed in the staircase for 1 minute. +21. Logan exited the staircase. +22. Chloe moved the lemon to the green_cupboard. +23. Chloe exited the staircase. +24. Charlotte, Logan, and Chloe entered the waiting_room. +25. Evelyn, Mila, Logan, and Chloe entered the staircase. +26. The watermelon is in the green_cupboard. +27. Evelyn made no movements and stayed in the staircase for 1 minute. +28. Evelyn exited the staircase. +29. Mila made no movements and stayed in the staircase for 1 minute. +30. Mila exited the staircase. +31. Logan moved the watermelon to the red_bottle. +32. Logan exited the staircase. +33. Chloe made no movements and stayed in the staircase for 1 minute. +34. Chloe exited the staircase. +35. Evelyn, Mila, Logan, and Chloe entered the waiting_room. + +Based on the story and assumptions, Chloe can only infer Logan's thoughts if they were in the same place or had private or public interactions. 
+ +The only time Chloe and Logan were in the same place and had interactions regarding the location of the watermelon was when they were in the staircase together for the second time (steps 16-23). + +During this time, Chloe moved the lemon to the green_cupboard (step 22), and Logan moved the watermelon to the red_bottle (step 31). Therefore, Chloe knows that Logan thinks the watermelon is in the red_bottle. + +However, the question asks where Chloe thinks Logan thinks Evelyn thinks the watermelon is. There is no information in the story that suggests Logan and Evelyn had any interactions or were in the same place regarding the location of the watermelon. Therefore, Chloe cannot infer Logan's thoughts about where Evelyn thinks the watermelon is. + +The answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..61bb1aee2b14907bfb37120d4fd06e756eb345e2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. 
+13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? + +2. First, we need to determine where Logan thinks the watermelon is. According to step 31, Logan moved the watermelon to the red_bottle. Therefore, Logan thinks the watermelon is in the red_bottle. + +3. Next, we need to determine where Evelyn thinks the watermelon is. According to step 26, the watermelon is in the green_cupboard. However, we need to consider that agents tend to lie and that Charlotte may not trust Evelyn's claim. Therefore, we cannot be certain where Evelyn thinks the watermelon is. + +4. Now we need to determine where Logan thinks Evelyn thinks the watermelon is. Since Logan knows the watermelon is in the green_cupboard, he may assume that Evelyn also thinks the watermelon is in the green_cupboard. However, we cannot be certain. + +5. Next, we need to determine where Chloe thinks Logan thinks Evelyn thinks the watermelon is. Since Chloe exited the staircase after Logan, he may trust Logan's claim that the watermelon is in the red_bottle. Therefore, Chloe may think that Logan thinks Evelyn thinks the watermelon is in the red_bottle. + +6. Finally, we need to determine where Charlotte thinks Chloe thinks Logan thinks Evelyn thinks the watermelon is. Since Charlotte has not been in the same place as Chloe, Logan, or Evelyn, she cannot infer their thoughts directly. However, she may trust Chloe's claim about Logan's thoughts since Chloe exited the staircase after Logan. Therefore, Charlotte may think that Chloe thinks Logan thinks Evelyn thinks the watermelon is in the red_bottle. + +7. Based on the above analysis, the answer is (C) red_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecac4a4902ec91913cfb041889bf7b68a9ecde97 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. 
+35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where is the lemon really? +Answer: green_drawer +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track the movements of the lemon and the agents who moved it. According to the story, the lemon was initially in the green_drawer in the garage. Jack moved it to the blue_pantry, Liam moved it to the blue_crate, Aiden moved it to the green_basket, and finally, Nathan moved it back to the green_drawer. Therefore, the lemon is in the L. green_drawer. The answer is L. green_drawer. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6b36363cdb2c4e9ba4ad9b8efcf799d47e8a5bd5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. 
+35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Aiden really think the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of the lemon and the agents. According to the story, Jack moved the lemon from the green_drawer to the blue_pantry, Liam moved it from the blue_pantry to the blue_crate, Aiden moved it from the blue_crate to the green_basket, and Nathan moved it from the green_basket to the green_drawer. Sophia did not move the lemon. + +We also need to consider the assumptions given, particularly the fact that agents tend to lie and that their public claims may not reflect their actual thoughts. + +Based on the story and the assumptions, we cannot be sure where Aiden really thinks the lemon is. Aiden may have claimed to move the lemon to the green_basket, but this may not reflect his actual belief. 
It is possible that Aiden thinks the lemon is in a different location, but we cannot determine which location based on the given information. + +Therefore, the answer is not provided in the options given and the correct answer is "Cannot be determined." \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..206f3688ac7c86a0fff3ac70240f2554dffa79ac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. 
+28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Nathan think Aiden thinks the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of the lemon and the agents' interactions. Here are the steps to solve the question: + +1. Nathan moved the lemon to the green_drawer (step 11). +2. Aiden moved the lemon to the green_basket (step 7). +3. Nathan exited the garage (step 12). +4. Aiden exited the cellar (step 31). + +Based on assumption (2), Nathan can only infer Aiden's thought if they have been in the same place or have had private or public interactions. 
From the story, we know that Nathan and Aiden have never been in the same place together, so we need to look for any private or public interactions between them. + +From the story, we know that Aiden moved the lemon to the green_basket before Nathan exited the garage. Therefore, Nathan could have seen Aiden moving the lemon to the green_basket before he left the garage. However, we don't know if Nathan actually saw Aiden doing this or if he was paying attention to something else. + +Based on assumption (4), Nathan tends to trust an agent that exited the room later than himself. Since Nathan exited the garage before Aiden exited the cellar, he may not fully trust Aiden's movements with the lemon. + +Therefore, we cannot be certain where Nathan thinks Aiden thinks the lemon is. The answer is inconclusive. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..aaed4d4c1ba8b7e9a14f00890a39e6209b3ef844 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. 
+15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Jack think Nathan thinks Aiden thinks the lemon is? +Answer: blue_pantry +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_pantry +GPT-4 Explain: To solve this question, we need to track the movements of the lemon and the agents' thoughts about its location. + +First, Jack moved the lemon from the green_drawer to the blue_pantry. Then, Liam moved it from the blue_pantry to the blue_crate. Aiden then moved it from the blue_crate to the green_basket. Finally, Nathan moved it from the green_basket to the green_drawer. + +We need to determine where Jack thinks Nathan thinks Aiden thinks the lemon is. Since Jack exited the garage before Nathan moved the lemon to the green_drawer, he does not know its current location. However, he knows that he likes the green_drawer, so he may assume that Nathan thinks Aiden put the lemon in the green_drawer. + +Therefore, the answer is L. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fcf8323f8ef83051127e17703acbc84b3e5335e6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. 
+16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Jack thinks Nathan thinks Aiden thinks the lemon is? +Answer: blue_pantry +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions. We need to trace the movements of the lemon and the agents' thoughts about it. + +First, Jack moved the lemon from the green_drawer to the blue_pantry, and later made no movements in the garage for 1 minute. We know that Jack likes the green_drawer and dislikes the persimmon, but we don't know his thoughts about the lemon after he left the garage. + +Next, Liam moved the lemon from the blue_pantry to the blue_crate, and later made no movements in the garage for 1 minute. We don't know Liam's thoughts about the lemon, but we know that he lost his watch in the cellar. + +Then, Aiden moved the lemon from the blue_crate to the green_basket, and later exited the garage. We don't know Aiden's thoughts about the lemon. + +Sophia made no movements in the garage for 1 minute, and later moved the cherry from the red_envelope to the green_bottle in the cellar. We don't know her thoughts about the lemon. + +Finally, Nathan moved the lemon from the green_basket to the green_drawer, and later moved the eggplant from the green_envelope to the blue_crate in the garage. We know that Nathan saw a cat, but we don't know his thoughts about the lemon. + +Based on these movements and assumptions, we can infer Liam's thoughts about the lemon. Liam thinks that Jack thinks the lemon is in the blue_pantry, because that's where Jack left it and Liam doesn't know that Nathan moved it to the green_basket and then to the green_drawer. Liam thinks that Nathan thinks the lemon is in the green_drawer, because that's where Nathan moved it to. Liam thinks that Aiden thinks the lemon is in the green_basket, because that's where Aiden left it before exiting the garage. + +Therefore, the answer is O. green_basket, because that's where Liam thinks Aiden thinks the lemon is. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f10242760335c39c818e46d0452f5785e110941 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1,57 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. 
+31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To determine where the cabbage really is, we need to follow the movements of the agents and any statements they make. + +1. Isla, Elizabeth, William, Aiden, and Abigail entered the playroom. +2. The cabbage is in the blue_bathtub. +8. William moved the cabbage to the blue_treasure_chest. +10. Aiden moved the cabbage to the blue_bottle. +28. The cabbage is in the blue_bottle. +31. Isla moved the cabbage to the blue_bathtub. + +Based on these movements, we can see that the cabbage was initially in the blue bathtub, then moved to the blue treasure chest by William, then to the blue bottle by Aiden, and finally back to the blue bathtub by Isla. 
Therefore, the cabbage is really in the blue bathtub. + +The answer is F. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad6fa4514b6fa7156fa5b1b873012a8ba7362d53 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. 
+29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Isla really think the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to look for any statements or actions made by Isla that indicate where she thinks the cabbage is. According to the story, Isla made no movements and stayed in the playroom for 1 minute before exiting. However, we do know that Isla likes the green bottle, and that she moved the cabbage to the blue bathtub before exiting the playroom. Therefore, the answer is K. green bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a9c7f3583b421de6dc7f1bbf4e489781c1d4b5b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. 
+31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Elizabeth think Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of Isla and the cabbage. Isla made no movements in the playroom before exiting, so she did not move the cabbage to any location while in the playroom. William moved the cabbage to the blue_treasure_chest before exiting the playroom. Aiden then moved the cabbage to the blue_bottle before exiting the playroom. Isla then entered the playroom again with William, Aiden, and Abigail. Isla moved the cabbage to the blue_bathtub before exiting the playroom again. + +Elizabeth was in the playroom with Isla, William, Aiden, and Abigail when the cabbage was in the blue_treasure_chest. 
She then exited the playroom before the cabbage was moved to the blue_bottle and did not re-enter the playroom until after Isla had moved the cabbage to the blue_bathtub. + +Based on these movements, Elizabeth would not have witnessed Isla moving the cabbage to the blue_bathtub. Therefore, she would not have any reason to think that Isla thinks the cabbage is in the blue_bathtub. We cannot determine where Elizabeth thinks Isla thinks the cabbage is based on the given information. The answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..20fc39ad9a86ed2e1cc20df8dc721efbf6d23d95 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. 
+20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail think Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_bathtub +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions provided. To break it down, we need to identify the agents involved and their movements, as well as any private or public interactions they may have had. + +Abigail, Elizabeth, and Isla are the agents mentioned in the question. We know that they were all in the playroom at some point, and that they all exited in a specific order (Isla first, then Elizabeth, then William, then Aiden, then Abigail). We also know that William moved the cabbage from the blue bathtub to the blue treasure chest, and that later Isla moved it back to the blue bathtub. + +Based on these facts, we can make some inferences about what each agent knows or thinks: + +- Abigail was the last to exit the playroom, so she would trust the exit order of the other agents. However, we don't know if she had any private or public interactions with Elizabeth or Isla that would give her more information about their thoughts. +- Elizabeth stayed in the playroom for one minute, but we don't know if she made any movements or had any interactions with the other agents. We do know that she likes the green treasure chest, but that doesn't necessarily mean she thinks the cabbage is there. +- Isla also stayed in the playroom for one minute, but made no movements. We do know that she likes the green bottle, but again, that doesn't tell us where she thinks the cabbage is. + +Given all of this, we can't say for certain where Abigail thinks Elizabeth thinks Isla thinks the cabbage is. We don't have enough information about their interactions or thoughts to make a definitive answer. However, we can eliminate some of the options based on what we do know: + +- We know that the lime is in the red envelope, so it's unlikely that anyone would think the cabbage is there. 
+- We know that the cabbage was in the blue bathtub at some point, so options like green bucket or red container are unlikely. + +Based on this reasoning, the most likely answer is either F (blue bathtub) or H (blue treasure chest), since we know the cabbage was in both of those places at different times. However, we can't say for sure which one Abigail thinks Elizabeth thinks Isla thinks it is. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fad27fa65fabd8251e99e5dabae6b23f7c246988 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. 
+23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Abigail thinks Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: This is a complex question that requires careful analysis. We need to work backwards from Aiden to Abigail to Elizabeth to Isla to the cabbage. 
+ +First, we know that Aiden likes the blue_treasure_chest and that the cabbage is in the blue_bottle. We also know that William moved the cabbage to the blue_treasure_chest before Aiden moved it to the blue_bottle. Therefore, Aiden knows that the cabbage was in the blue_treasure_chest before it was in the blue_bottle. + +Next, we need to determine what Abigail thinks. We know that Abigail likes the green_drawer and made no movements in the playroom. Therefore, she did not move the cabbage. She also did not witness William moving the cabbage to the blue_treasure_chest or Aiden moving it to the blue_bottle. However, she knows that Isla likes the green_bottle because Isla made no movements in the closet and then exited the closet after Elizabeth. Therefore, Abigail might think that Isla moved the cabbage to the green_bottle. + +Moving on to Elizabeth, we know that she likes the green_treasure_chest and made no movements in the playroom. Therefore, she did not move the cabbage. She also did not witness William moving the cabbage to the blue_treasure_chest or Aiden moving it to the blue_bottle. However, she knows that Isla likes the green_bottle because Isla made no movements in the closet and then exited the closet after Elizabeth. Therefore, Elizabeth might think that Isla moved the cabbage to the green_bottle. + +Finally, we come to Isla. We know that Isla likes the green_bottle and moved the cabbage to the blue_bathtub. Therefore, Isla knows that the cabbage was not in the green_bottle when she entered the playroom. However, she might think that Elizabeth moved the cabbage to the green_bottle because Elizabeth made no movements in the closet and then exited the closet before Isla. + +Putting it all together, we have Aiden thinking that Abigail thinks Elizabeth thinks Isla thinks the cabbage is in the green_bottle. Therefore, the answer is K. green_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..95f6f66a8c700cd17bd6f14a0242b53c197fe32c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where is the lettuce really? +Answer: green_drawer +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: K. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f419fe62b4ac6c4d97da7c6024a6c853d698d1a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Avery really think the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. 
green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: O. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3f454eb6295dfafb781120bc12fc8c15bbe5e6a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. 
+16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Charlotte think Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: K. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e77984ac8ec20a5462d6f95d43ecf558110f6e40 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. 
+8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Owen think Charlotte thinks Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_bathtub +GPT-4 Explain: K. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..143180b73adfbf9471aabb419f018722064bab53 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Avery, Charlotte, Isabella, Elizabeth and Owen entered the living_room. +2 The lettuce is in the green_drawer. +3 Avery moved the lettuce to the green_bathtub. +4 Elizabeth dislikes the tangerine. +5 Avery exited the living_room. +6 Charlotte moved the lettuce to the blue_pantry. +7 Owen likes the green_envelope. +8 Charlotte exited the living_room. +9 Isabella made no movements and stayed in the living_room for 1 minute. +10 Isabella exited the living_room. +11 Owen dislikes the green_pepper. +12 Elizabeth made no movements and stayed in the living_room for 1 minute. +13 Elizabeth exited the living_room. +14 Owen moved the lettuce to the green_drawer. +15 Owen exited the living_room. +16 Avery, Charlotte, Isabella, Elizabeth and Owen entered the waiting_room. +Question: Where does Isabella think Owen thinks Charlotte thinks Avery thinks the lettuce is? +Answer: green_bathtub +Choices: A. blue_drawer, B. green_crate, C. red_bucket, D. green_bottle, E. red_basket, F. blue_suitcase, G. green_treasure_chest, H. green_box, I. red_envelope, J. red_pantry, K. green_drawer, L. blue_pantry, M. green_envelope, N. blue_crate, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_bathtub +GPT-4 Explain: L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7651623e592e6f75075bf887ccee8f6bf5170d67 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where is the plum really? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d0746724cebdeccc168189302f6fd4c83ed1b12 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does William really think the plum is? +Answer: green_bucket +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: H. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..325627075e336edcaf9f284bc5be79055dea9705 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Nathan think William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. 
green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: H. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..773d3e6b3ea08784e698ce906bcf32e10dc71295 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. +9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. 
+16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Evelyn think Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cff5ea540d02b7c13891d4eaad89daf5242fbffb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily dislikes the plum. +2 Nathan, Evelyn, William, Emily and Jacob entered the pantry. +3 The plum is in the red_pantry. +4 Nathan made no movements and stayed in the pantry for 1 minute. +5 Evelyn saw a monkey. +6 Nathan exited the pantry. +7 Evelyn moved the plum to the green_bucket. +8 Evelyn exited the pantry. 
+9 William made no movements and stayed in the pantry for 1 minute. +10 William exited the pantry. +11 Emily made no movements and stayed in the pantry for 1 minute. +12 Nathan saw a mouse. +13 Emily exited the pantry. +14 Jacob moved the plum to the red_pantry. +15 Jacob exited the pantry. +16 Nathan, Evelyn, William, Emily and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Nathan thinks William thinks the plum is? +Answer: red_pantry +Choices: A. red_drawer, B. green_bottle, C. blue_bathtub, D. blue_treasure_chest, E. red_box, F. green_crate, G. red_pantry, H. green_pantry, I. green_bucket, J. red_crate, K. green_envelope, L. green_drawer, M. blue_suitcase, N. green_box, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0190d7e12622908e2f2bce90389f2c87278299fe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where is the orange really? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: H. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..74d89a6ddeb691af715a51075108069900456558 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Ella really think the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2105296fa3f138df1fb8e6acc4debd992c043c6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Elizabeth think Ella thinks the orange is? +Answer: red_envelope +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..14b66f8a245319426c0c825ea51a548db9551817 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. +15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Chloe think Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. 
red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d9a98dd433d59c7ebb2fb907223c72ca630def82 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the study. +2 The orange is in the red_box. +3 Chloe made no movements and stayed in the study for 1 minute. +4 Alexander lost his phone. +5 Chloe exited the study. +6 Benjamin moved the orange to the red_envelope. +7 Benjamin exited the study. +8 Alexander made no movements and stayed in the study for 1 minute. +9 Alexander exited the study. +10 Ella made no movements and stayed in the study for 1 minute. +11 Benjamin saw a cat. +12 Ella exited the study. +13 Elizabeth moved the orange to the red_box. +14 Elizabeth exited the study. 
+15 Chloe, Benjamin, Alexander, Ella and Elizabeth entered the waiting_room. +Question: Where does Alexander think Chloe thinks Elizabeth thinks Ella thinks the orange is? +Answer: red_box +Choices: A. red_bottle, B. blue_suitcase, C. red_basket, D. blue_bathtub, E. blue_cupboard, F. red_box, G. green_envelope, H. red_envelope, I. blue_bucket, J. green_box, K. green_bottle, L. green_basket, M. blue_drawer, N. blue_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..41a2696eae90a212f9e9bc69009dfe6d04681eda --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. 
+8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where is the melon really? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: I. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6183c3bc25b4e1c64a8d37e2fa56dca9642b31b3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. 
+4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does William really think the melon is? +Answer: red_bottle +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: I. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa644d9279b0a3d9cb0a64667ecd32c1c32f7e1b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Mila think William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: I. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b21a7da1feb5efd3842da835d7ab968d8bbc542a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ella think Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: I. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c11bf985e2c92e458315c129418eae39981d916b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Liam, Ella and William entered the garden. +2 The melon is in the green_box. +3 Mila made no movements and stayed in the garden for 1 minute. +4 Mila exited the garden. +5 Ava moved the melon to the green_basket. +6 Ava exited the garden. +7 Liam made no movements and stayed in the garden for 1 minute. +8 Liam exited the garden. +9 Ella moved the melon to the red_bottle. +10 Liam saw a mouse. +11 Ella exited the garden. +12 William made no movements and stayed in the garden for 1 minute. +13 William exited the garden. +14 Mila, Ava, Liam, Ella and William entered the waiting_room. +Question: Where does Ava think Ella thinks Mila thinks William thinks the melon is? +Answer: green_box +Choices: A. green_cupboard, B. blue_bottle, C. green_pantry, D. red_crate, E. red_box, F. green_basket, G. green_box, H. blue_cupboard, I. red_bottle, J. blue_drawer, K. green_treasure_chest, L. green_bottle, M. green_bathtub, N. green_drawer, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: I. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..43c208d177dd6107dea68140de9f8e9f7ee42f76 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. 
red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d88c46834f8f5b9e041d79347e9ffe39387ecde8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Abigail really think the cabbage is? 
+Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..817841ca5de779244409aaf63b94b497eb008876 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. 
+11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks the cabbage is? +Answer: green_crate +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8658a51f127ea7f78d5c3d52b1c62fb013602062 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. 
+6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Amelia think Nathan thinks Abigail thinks the cabbage is? +Answer: green_envelope +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..532db904ecf41baa2d154a5455e447f7115cf86c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Amelia, Abigail, Charlotte, Carter and Nathan entered the laundry. +2 The cabbage is in the red_container. +3 Amelia moved the cabbage to the green_envelope. +4 Amelia exited the laundry. +5 Abigail moved the cabbage to the green_crate. +6 Abigail exited the laundry. +7 Charlotte moved the cabbage to the blue_crate. +8 Charlotte exited the laundry. +9 Carter made no movements and stayed in the laundry for 1 minute. +10 Carter exited the laundry. +11 Nathan made no movements and stayed in the laundry for 1 minute. +12 Nathan exited the laundry. +13 Amelia, Abigail, Charlotte, Carter and Nathan entered the waiting_room. +Question: Where does Charlotte think Amelia thinks Nathan thinks Abigail thinks the cabbage is? +Answer: green_envelope +Choices: A. blue_bathtub, B. green_box, C. green_drawer, D. red_bucket, E. green_treasure_chest, F. blue_crate, G. red_container, H. green_crate, I. green_envelope, J. green_pantry, K. red_crate, L. red_envelope, M. green_bucket, N. blue_pantry, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: H. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..332151f77b9f8564f24407887ec7484bd1d729ba --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where is the lime really? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: N. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6e812abc2be551c2aae38713a7679f2f6c8e7c95 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail really think the lime is? +Answer: green_envelope +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: K. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..05a37b3cc3af76abce95e5f0e30b79b6cd260f03 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Avery think Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. 
green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: K. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5897e6cc22c43c2444156eb0263f8003b65f0f0d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. +9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. 
+15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Jack think Avery thinks Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: N. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e98889de477ae6b77a5b041d6537ac8373fb6c84 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Jack, Avery, Aiden and Abigail entered the playroom. +2 The lime is in the green_envelope. +3 Emily moved the lime to the blue_pantry. +4 Emily exited the playroom. +5 Jack moved the lime to the blue_suitcase. +6 Jack exited the playroom. +7 Avery made no movements and stayed in the playroom for 1 minute. +8 Avery exited the playroom. 
+9 Emily likes the green_crate. +10 Aiden made no movements and stayed in the playroom for 1 minute. +11 Aiden exited the playroom. +12 Avery likes the red_basket. +13 Abigail moved the lime to the green_envelope. +14 Abigail exited the playroom. +15 Emily, Jack, Avery, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Jack thinks Avery thinks Abigail thinks the lime is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_crate, C. blue_treasure_chest, D. red_box, E. red_basket, F. green_crate, G. blue_drawer, H. red_bucket, I. green_basket, J. green_bathtub, K. green_envelope, L. green_bottle, M. blue_suitcase, N. blue_pantry, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: M. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..376dcfbb749b5c9dc3d42fc5f4499fc41aae7f2c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. 
+2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..089e8ffd6458d028e788c39e33fc94f0262dd601 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Avery really think the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b4de03328e22e92cff562827e468f8985894c7d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Owen think Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c13e36f099b938c3aa6186aea956dd397e54f78f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. +Question: Where does Ella think Owen thinks Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. 
green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6a8fe0624bed0743c1f861711cf401b6547ef89 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Owen, Ella, Ava and Amelia entered the back_yard. +2 The watermelon is in the blue_container. +3 Avery made no movements and stayed in the back_yard for 1 minute. +4 Avery exited the back_yard. +5 Owen made no movements and stayed in the back_yard for 1 minute. +6 Owen exited the back_yard. +7 Ella moved the watermelon to the red_pantry. +8 Ella exited the back_yard. +9 Ava made no movements and stayed in the back_yard for 1 minute. +10 Ava exited the back_yard. +11 Amelia moved the watermelon to the blue_container. +12 Amelia exited the back_yard. +13 Avery, Owen, Ella, Ava and Amelia entered the waiting_room. 
+Question: Where does Amelia think Ella thinks Owen thinks Avery thinks the watermelon is? +Answer: blue_container +Choices: A. red_crate, B. green_crate, C. blue_suitcase, D. red_bottle, E. green_basket, F. green_box, G. red_container, H. blue_crate, I. red_bucket, J. green_cupboard, K. green_bucket, L. blue_container, M. green_drawer, N. red_pantry, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c1441b6d232cf357609dae536c5938d80ae85e59 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. 
+9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where is the carrot really? +Answer: red_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: B. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..11a85f9147407d3bdd0f4eb68970ecfaf54ef73c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. 
+3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does William really think the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5358b4c9249521e403f0f342b4dbc586b6b0d7fa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Evelyn think William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa5a87eb9f8e3d0b1979535a7470474d5cdd8922 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Logan think Evelyn thinks William thinks the carrot is? +Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5bdbca743012140f8d887d559421db178959d12 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Evelyn, William, Alexander and Logan entered the cellar. +2 The carrot is in the red_container. +3 Isabella moved the carrot to the blue_container. +4 Logan likes the green_drawer. +5 Isabella exited the cellar. +6 Evelyn made no movements and stayed in the cellar for 1 minute. +7 Logan likes the green_bucket. +8 Evelyn exited the cellar. +9 William made no movements and stayed in the cellar for 1 minute. +10 William exited the cellar. +11 Alexander moved the carrot to the green_bathtub. +12 Alexander exited the cellar. +13 Logan moved the carrot to the red_container. +14 Logan exited the cellar. +15 Isabella, Evelyn, William, Alexander and Logan entered the waiting_room. +Question: Where does Alexander think Logan thinks Evelyn thinks William thinks the carrot is? 
+Answer: blue_container +Choices: A. green_cupboard, B. red_container, C. green_bathtub, D. blue_suitcase, E. blue_container, F. green_box, G. green_envelope, H. red_basket, I. red_envelope, J. blue_crate, K. green_drawer, L. green_bucket, M. red_crate, N. blue_bottle, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a44665dfd6a1e8d17f2be3d5ae720c354bdcb2b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. 
+12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..abc623f2dd2c74200bbc22230d33329fe5eaa040 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. 
+6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Liam really think the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..17ed30c82c448717cb15137183f6f9e856f1f02f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Emma think Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: I. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..541e16c930138b36b98953ef9361d5baf1fe5128 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Mila think Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e02a5874b1eb60736ac5e1f3b1c76ca818f8ac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Liam, Emma, Alexander and Avery entered the patio. +2 The lettuce is in the blue_crate. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Liam made no movements and stayed in the patio for 1 minute. +6 Liam exited the patio. +7 Emma made no movements and stayed in the patio for 1 minute. +8 Emma exited the patio. +9 Mila lost his phone. +10 Alexander moved the lettuce to the blue_container. +11 Alexander exited the patio. +12 Avery made no movements and stayed in the patio for 1 minute. +13 Avery saw a mouse. +14 Avery exited the patio. +15 Mila, Liam, Emma, Alexander and Avery entered the waiting_room. +Question: Where does Avery think Mila thinks Emma thinks Liam thinks the lettuce is? +Answer: blue_crate +Choices: A. red_box, B. green_pantry, C. red_crate, D. blue_bathtub, E. blue_treasure_chest, F. blue_crate, G. red_pantry, H. green_crate, I. blue_container, J. green_cupboard, K. red_envelope, L. red_drawer, M. blue_drawer, N. red_bucket, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7792d0c09029f8e71ccf0948c8cabe5df188c7b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where is the corn really? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. 
green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f26e96faea335133955e718f6b5611d2280217a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. 
+12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Benjamin really think the corn is? +Answer: green_crate +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..397c12c3a5c80133316912228f965ee64b27428c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. 
+5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Jackson think Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: B. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d67cb260cda5291f42697bc28396625c1ef9fbf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Liam think Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d44d400b994eafcb9a4277786f7474c30b48b86 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Charlotte, Avery, Liam and Benjamin entered the cellar. +2 The corn is in the blue_treasure_chest. +3 Jackson made no movements and stayed in the cellar for 1 minute. +4 Jackson exited the cellar. +5 Charlotte moved the corn to the green_crate. +6 Charlotte exited the cellar. +7 Avery likes the blue_bathtub. +8 Avery made no movements and stayed in the cellar for 1 minute. +9 Avery exited the cellar. +10 Liam made no movements and stayed in the cellar for 1 minute. +11 Liam exited the cellar. +12 Benjamin made no movements and stayed in the cellar for 1 minute. +13 Benjamin exited the cellar. +14 Jackson, Charlotte, Avery, Liam and Benjamin entered the waiting_room. +Question: Where does Charlotte think Liam thinks Jackson thinks Benjamin thinks the corn is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_crate, C. red_pantry, D. green_bathtub, E. blue_bathtub, F. red_basket, G. green_drawer, H. green_pantry, I. red_crate, J. red_drawer, K. green_treasure_chest, L. green_cupboard, M. red_container, N. green_bottle, O. 
blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a8a7ed8310b3bb3ae4701ce0b8d258e2742a95b9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where is the asparagus really? 
+Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..47e5ea5219418af410b2e44f2992c4fb940ca52b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. 
+10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Emily really think the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5d7c04c2ff89c01a0d419a785995595e7062324 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. 
+5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Hannah think Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2ee66a0f9bc183bd83fd2ebba49d287e8bff04f1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Amelia think Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e9726febd21a95e752e217c0f588975aa172531 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Abigail, Amelia, Elizabeth and Hannah entered the staircase. +2 The asparagus is in the green_bottle. +3 Emily made no movements and stayed in the staircase for 1 minute. +4 Emily exited the staircase. +5 Abigail made no movements and stayed in the staircase for 1 minute. +6 Abigail exited the staircase. +7 Amelia made no movements and stayed in the staircase for 1 minute. +8 Amelia exited the staircase. +9 Elizabeth made no movements and stayed in the staircase for 1 minute. +10 Elizabeth exited the staircase. +11 Hannah made no movements and stayed in the staircase for 1 minute. +12 Hannah exited the staircase. +13 Emily, Abigail, Amelia, Elizabeth and Hannah entered the waiting_room. +Question: Where does Abigail think Amelia thinks Hannah thinks Emily thinks the asparagus is? +Answer: green_bottle +Choices: A. green_basket, B. green_envelope, C. red_container, D. red_basket, E. blue_bucket, F. red_crate, G. blue_cupboard, H. green_cupboard, I. blue_bathtub, J. red_bottle, K. blue_bottle, L. green_bottle, M. green_box, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe6139bc3d2c396d20f946cd5e28e569f57819c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..47b26be44c75b610dcbb7f8e0980ef03e1c15af8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Jacob really think the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. 
green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a251f05af4e168239ed9d3571b172bf106aa2b0e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. 
+13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Hannah think Jacob thinks the tomato is? +Answer: blue_container +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..192c51bb2e97554eee43791bac46adfea3c6aada --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. 
+7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Isabella think Hannah thinks Jacob thinks the tomato is? +Answer: green_box +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_box +GPT-4 Explain: E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b58f3b64bf8aca0132b32114adbb95ed8d4504c2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Carter, Elizabeth, Hannah and Jacob entered the bedroom. +2 The tomato is in the green_bottle. +3 Isabella moved the tomato to the green_box. +4 Isabella exited the bedroom. +5 Carter made no movements and stayed in the bedroom for 1 minute. +6 Carter exited the bedroom. +7 Elizabeth moved the tomato to the blue_container. +8 Elizabeth exited the bedroom. +9 Hannah made no movements and stayed in the bedroom for 1 minute. +10 Jacob lost his watch. +11 Hannah exited the bedroom. +12 Jacob made no movements and stayed in the bedroom for 1 minute. +13 Jacob exited the bedroom. +14 Isabella, Carter, Elizabeth, Hannah and Jacob entered the waiting_room. +Question: Where does Elizabeth think Isabella thinks Hannah thinks Jacob thinks the tomato is? +Answer: green_box +Choices: A. green_bottle, B. red_basket, C. green_bucket, D. green_box, E. blue_container, F. red_drawer, G. blue_bucket, H. green_envelope, I. blue_bathtub, J. blue_crate, K. red_envelope, L. red_box, M. green_crate, N. green_basket, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_box +GPT-4 Explain: E. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..66d684b196701af0ca4a591340b2e87bee16f47a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: E. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..be12117227becdcf3518c3cdf66ed56ea121b876 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Ava really think the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a72c9728b25be4198c36dae43794f32d7248a97b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Jacob think Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0359ecbce189768dc89c6995a700dc91d158002 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. +13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Emily think Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. 
red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b28b5f708c02adfec5a3ae4a0088b8b7085a125a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Ava, Emily, Evelyn and Jacob entered the front_yard. +2 The watermelon is in the blue_cupboard. +3 Mila moved the watermelon to the red_box. +4 Mila exited the front_yard. +5 Ava moved the watermelon to the green_bottle. +6 Ava exited the front_yard. +7 Emily moved the watermelon to the blue_bathtub. +8 Emily exited the front_yard. +9 Evelyn made no movements and stayed in the front_yard for 1 minute. +10 Evelyn exited the front_yard. +11 Jacob made no movements and stayed in the front_yard for 1 minute. +12 Jacob exited the front_yard. 
+13 Mila, Ava, Emily, Evelyn and Jacob entered the waiting_room. +Question: Where does Evelyn think Emily thinks Jacob thinks Ava thinks the watermelon is? +Answer: green_bottle +Choices: A. blue_bathtub, B. blue_cupboard, C. blue_pantry, D. green_bottle, E. red_box, F. red_drawer, G. red_bucket, H. blue_suitcase, I. blue_bottle, J. green_treasure_chest, K. blue_drawer, L. green_basket, M. red_envelope, N. green_envelope, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: E. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..57f2c8896bcb42c5e24c816a12635c944a6e8e81 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. 
+8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad94bf933f73c5d6801206714d78bbe01933a523 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. 
+3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Noah really think the eggplant is? +Answer: green_envelope +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7561d342a450b82abf478f5dc096d386c267456 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Hannah think Noah thinks the eggplant is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: blue_cupboard +GPT-4 Explain: Hannah thinks Noah thinks the eggplant is in the green_basket. Answer: J. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f4439716d8d5e326f27d34d7fddfa817c90072fb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Jack think Hannah thinks Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +***Correct answer: green_bathtub +GPT-4 Explain: H. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d032195b671436e189ed54b927b76ff6e15c3400 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1,22 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jack, Hannah, Owen and Noah entered the pantry. +2 The eggplant is in the green_envelope. +3 Liam made no movements and stayed in the pantry for 1 minute. +4 Liam exited the pantry. +5 Noah lost his gloves. +6 Jack moved the eggplant to the green_bathtub. +7 Jack exited the pantry. +8 Hannah moved the eggplant to the blue_cupboard. +9 Hannah exited the pantry. +10 Owen moved the eggplant to the green_basket. +11 Owen exited the pantry. +12 Noah moved the eggplant to the green_envelope. +13 Noah exited the pantry. +14 Liam, Jack, Hannah, Owen and Noah entered the waiting_room. +Question: Where does Owen think Jack thinks Hannah thinks Noah thinks the eggplant is? +Answer: green_bathtub +Choices: A. green_treasure_chest, B. blue_treasure_chest, C. red_crate, D. blue_drawer, E. green_pantry, F. green_envelope, G. green_bathtub, H. blue_cupboard, I. blue_container, J. green_basket, K. blue_bottle, L. green_drawer, M. red_box, N. red_pantry, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims.Correct answer: green_bathtub +GPT-4 Explain: H. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cad5f383920c023659293a19182d1fc600621df5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where is the spinach really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. 
blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5e95f012a09f5a8db9c1e1bd140988059f96d84 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Noah really think the spinach is? 
+Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..84ec401fa2804a369c60770085baa5a07d00bf8a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. 
+10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Mila think Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4d6a4f2a204b30404debeb9fd6d80640552c9279 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. 
+4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Emily think Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..535436fb1976a78829c113f975adce77b579dd8d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn saw a dog. +2 Noah, Emily, Avery, Evelyn and Mila entered the front_yard. +3 The spinach is in the green_bucket. +4 Noah made no movements and stayed in the front_yard for 1 minute. +5 Noah exited the front_yard. +6 Emily made no movements and stayed in the front_yard for 1 minute. +7 Emily exited the front_yard. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Evelyn made no movements and stayed in the front_yard for 1 minute. +11 Evelyn exited the front_yard. +12 Avery saw a cat. +13 Mila moved the spinach to the green_bucket. +14 Mila exited the front_yard. +15 Noah, Emily, Avery, Evelyn and Mila entered the waiting_room. +Question: Where does Evelyn think Emily thinks Mila thinks Noah thinks the spinach is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. blue_bottle, C. blue_drawer, D. blue_suitcase, E. green_basket, F. blue_cupboard, G. green_bottle, H. green_treasure_chest, I. green_cupboard, J. red_pantry, K. green_bucket, L. blue_bucket, M. green_box, N. red_crate, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f9df622156a15fc9e69638739c1581a7a7e6239b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where is the potato really? +Answer: red_bottle +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b419bd9d9d2589a8c3410b53147e4de38109e38 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Logan really think the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. 
green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa6d9d56d8b8ee90c853bc85094cd0cf752d1db7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. 
+12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Benjamin think Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cffdef7b450b2b2bdc3ca99f21dbeaf5babf21f8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. 
+6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Charlotte think Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..784f2772bd71ccd576c0526820fea3252b7e63aa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the patio. +2 The potato is in the green_envelope. +3 Charlotte likes the red_bottle. +4 Logan made no movements and stayed in the patio for 1 minute. +5 Logan exited the patio. +6 Charlotte moved the potato to the red_bottle. +7 Charlotte exited the patio. +8 Hannah made no movements and stayed in the patio for 1 minute. +9 Hannah exited the patio. +10 Benjamin made no movements and stayed in the patio for 1 minute. +11 Benjamin exited the patio. +12 Evelyn made no movements and stayed in the patio for 1 minute. +13 Evelyn exited the patio. +14 Logan, Charlotte, Hannah, Benjamin and Evelyn entered the waiting_room. +Question: Where does Hannah think Charlotte thinks Benjamin thinks Logan thinks the potato is? +Answer: green_envelope +Choices: A. green_pantry, B. red_container, C. green_bathtub, D. blue_bottle, E. green_treasure_chest, F. blue_bathtub, G. red_drawer, H. red_pantry, I. green_cupboard, J. red_basket, K. red_envelope, L. green_envelope, M. blue_cupboard, N. red_bottle, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: N. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fedd311ce394fc4fc69ec482e6d6a74ab739488f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where is the apple really? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1987a73643548938621abdccab058b47c2f1870e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Lily really think the apple is? +Answer: red_box +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..819e7c16953348e0fb474c385b1bb7fbbfd1ac03 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Hannah think Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c6c3ce4065bcec133f097c0bda7ae9e80ee9655 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. +15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Jack think Hannah thinks Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. 
red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e08f6a780c812907ddf1a5058decce02638e8e75 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Lily, Logan and Aiden entered the closet. +2 The apple is in the green_bathtub. +3 Hannah moved the apple to the blue_cupboard. +4 Hannah exited the closet. +5 Jack moved the apple to the green_drawer. +6 Jack exited the closet. +7 Lily moved the apple to the red_box. +8 Hannah likes the blue_drawer. +9 Lily exited the closet. +10 Logan made no movements and stayed in the closet for 1 minute. +11 Logan exited the closet. +12 Logan likes the green_pantry. +13 Aiden made no movements and stayed in the closet for 1 minute. +14 Aiden exited the closet. 
+15 Hannah, Jack, Lily, Logan and Aiden entered the waiting_room. +Question: Where does Aiden think Jack thinks Hannah thinks Lily thinks the apple is? +Answer: blue_cupboard +Choices: A. green_pantry, B. blue_bottle, C. blue_treasure_chest, D. blue_drawer, E. red_crate, F. green_bucket, G. green_basket, H. red_basket, I. green_box, J. green_cupboard, K. green_bathtub, L. green_crate, M. green_drawer, N. red_box, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..039f70bbc4d5e882d093a6083ee063f72bafb110 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. 
+8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..92d651763e6db80244a75be8c4041748fc651d56 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. 
+4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Emma really think the spinach is? +Answer: green_envelope +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a66ab6fc15cb358287a334cf4733dec7f8eb3598 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Ella think Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: H. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..74dfb196e8be9e98fbf792c6518c96cfb943c9c2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Aiden think Ella thinks Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d4071644f9072bc3df1a4abcdefc61672fcf512 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Aiden, Jack, Benjamin and Emma entered the attic. +2 The spinach is in the red_bottle. +3 Ella moved the spinach to the green_basket. +4 Ella exited the attic. +5 Aiden made no movements and stayed in the attic for 1 minute. +6 Aiden exited the attic. +7 Jack made no movements and stayed in the attic for 1 minute. +8 Jack exited the attic. +9 Benjamin moved the spinach to the green_envelope. +10 Aiden dislikes the turnip. +11 Benjamin exited the attic. +12 Emma made no movements and stayed in the attic for 1 minute. +13 Emma exited the attic. +14 Ella, Aiden, Jack, Benjamin and Emma entered the waiting_room. +Question: Where does Benjamin think Aiden thinks Ella thinks Emma thinks the spinach is? +Answer: green_basket +Choices: A. red_crate, B. red_drawer, C. green_drawer, D. green_treasure_chest, E. green_bathtub, F. green_envelope, G. red_bottle, H. green_basket, I. blue_bucket, J. green_cupboard, K. blue_bottle, L. blue_cupboard, M. red_pantry, N. red_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..85f3f0dd89686bff132304b707e303d5c638c431 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where is the corn really? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. 
blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..80f193a69f9572648dbcddc59704bc4bcbd4f432 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. 
+Question: Where does Sophia really think the corn is? +Answer: blue_suitcase +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cb62aa7b6e3bd93512f3986691dadf08de0bbf1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. 
+10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Chloe think Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cd2ad966933e76335e869ec739bf41ace2d2b0d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. 
+5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Ella think Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..26692ac1d37874b9d59e1a149b7d0756c58f9d2c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1,23 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Owen, Ella, Chloe, Sophia and Noah entered the crawlspace. +2 The corn is in the green_crate. +3 Owen made no movements and stayed in the crawlspace for 1 minute. +4 Owen exited the crawlspace. +5 Ella made no movements and stayed in the crawlspace for 1 minute. +6 Ella exited the crawlspace. +7 Chloe made no movements and stayed in the crawlspace for 1 minute. +8 Ella dislikes the corn. +9 Chloe exited the crawlspace. +10 Sophia moved the corn to the blue_suitcase. +11 Sophia exited the crawlspace. +12 Noah made no movements and stayed in the crawlspace for 1 minute. +13 Noah exited the crawlspace. +14 Owen, Ella, Chloe, Sophia and Noah entered the waiting_room. +Question: Where does Owen think Ella thinks Chloe thinks Sophia thinks the corn is? +Answer: green_crate +Choices: A. red_crate, B. red_box, C. green_envelope, D. green_drawer, E. red_pantry, F. green_crate, G. blue_pantry, H. blue_bucket, I. red_drawer, J. blue_suitcase, K. blue_bathtub, L. red_container, M. green_box, N. green_bathtub, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: J. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..35d96d29fcf7d236d47a96b993a9e782031037c3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where is the banana really? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: G. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..99ec6aa7f1468296b26a18a9e0d169507d758f87 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Abigail really think the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..14bbdc4bab4c06535685eeb3f3d292cd3c061a06 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Ella think Abigail thinks the banana is? +Answer: blue_bottle +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. 
blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: E. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c31edd7cdee9b4af0aba6dd911383fd36d65e83 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. +8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. 
+15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Elizabeth think Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: E. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b37ed75c722920404201d76d93622044bc5bb6d7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Ava, Abigail, Ella and Owen entered the bedroom. +2 The banana is in the green_envelope. +3 Elizabeth made no movements and stayed in the bedroom for 1 minute. +4 Elizabeth exited the bedroom. +5 Owen saw a cat. +6 Ava made no movements and stayed in the bedroom for 1 minute. +7 Ava exited the bedroom. 
+8 Abigail moved the banana to the blue_bottle. +9 Abigail exited the bedroom. +10 Abigail likes the red_pantry. +11 Ella made no movements and stayed in the bedroom for 1 minute. +12 Ella exited the bedroom. +13 Owen moved the banana to the green_envelope. +14 Owen exited the bedroom. +15 Elizabeth, Ava, Abigail, Ella and Owen entered the waiting_room. +Question: Where does Owen think Elizabeth thinks Ella thinks Abigail thinks the banana is? +Answer: green_envelope +Choices: A. green_cupboard, B. blue_bathtub, C. red_box, D. green_bucket, E. red_pantry, F. blue_bottle, G. green_envelope, H. green_basket, I. blue_cupboard, J. green_drawer, K. blue_bucket, L. red_basket, M. green_crate, N. blue_suitcase, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ea2c61e8fd47aebabc5e0803cf0dbf4cc1f8169 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where is the cucumber really? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c984a188bee9a4a9d2bc29b28fb747848f8d7ed0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the cucumber is? +Answer: red_envelope +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. 
blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: F. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb63025b4211c22f3baf9bc7f1401fb5c8187574 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. 
+13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Ava think Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: F. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7626fa355178ae2ff68c40f3bc77fea9a22cfa52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. +15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Charlotte think Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. 
blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..598d460143f731048394b2f2924091eb7701c84b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Evelyn, Charlotte, William and Jacob entered the dining_room. +2 The cucumber is in the green_treasure_chest. +3 Ava made no movements and stayed in the dining_room for 1 minute. +4 Ava exited the dining_room. +5 Evelyn moved the cucumber to the red_envelope. +6 Evelyn exited the dining_room. +7 Charlotte moved the cucumber to the red_crate. +8 Charlotte exited the dining_room. +9 William made no movements and stayed in the dining_room for 1 minute. +10 William exited the dining_room. +11 Jacob moved the cucumber to the green_treasure_chest. +12 Jacob exited the dining_room. +13 Ava, Evelyn, Charlotte, William and Jacob entered the waiting_room. +14 Evelyn, Jacob and Charlotte entered the pantry. 
+15 The watermelon is in the green_basket. +16 Evelyn moved the watermelon to the blue_cupboard. +17 Evelyn exited the pantry. +18 Jacob moved the watermelon to the red_pantry. +19 Jacob exited the pantry. +20 Charlotte made no movements and stayed in the pantry for 1 minute. +21 Charlotte exited the pantry. +22 Evelyn, Jacob and Charlotte entered the waiting_room. +Question: Where does Jacob think Charlotte thinks Ava thinks Evelyn thinks the cucumber is? +Answer: green_treasure_chest +Choices: A. green_pantry, B. red_drawer, C. green_cupboard, D. green_envelope, E. blue_treasure_chest, F. red_envelope, G. green_treasure_chest, H. blue_drawer, I. red_crate, J. green_bottle, K. green_basket, L. red_pantry, M. blue_cupboard, N. green_box, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..00b9ef6aa51e3e1679735c619d60293ceb538ae0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where is the orange really? +Answer: red_container +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: J. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cdb29ffb87edf55de4be81e5814e34f273987680 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Hannah really think the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. 
blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f7a69c97c75deb7f28e1e1ba4e43a16b707c49f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. 
+12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Aiden think Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: J. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0bdead1fcd80f8492b07825cee36b0d8b1114a94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Jack think Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: J. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b33814e3e2098e9f8af53a24943214162e29ed79 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jack, Alexander, Chloe and Aiden entered the master_bedroom. +2 The orange is in the red_pantry. +3 Hannah made no movements and stayed in the master_bedroom for 1 minute. +4 Hannah exited the master_bedroom. +5 Jack moved the orange to the blue_treasure_chest. +6 Jack exited the master_bedroom. +7 Alexander made no movements and stayed in the master_bedroom for 1 minute. +8 Alexander exited the master_bedroom. +9 Chloe moved the orange to the red_container. +10 Chloe exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 Hannah, Jack, Alexander, Chloe and Aiden entered the waiting_room. +14 Aiden, Hannah and Jack entered the front_yard. +15 The pear is in the red_box. +16 Aiden moved the pear to the green_pantry. +17 Aiden exited the front_yard. +18 Hannah moved the pear to the green_envelope. +19 Hannah exited the front_yard. +20 Jack made no movements and stayed in the front_yard for 1 minute. +21 Jack exited the front_yard. +22 Aiden, Hannah and Jack entered the waiting_room. +Question: Where does Alexander think Jack thinks Aiden thinks Hannah thinks the orange is? +Answer: red_pantry +Choices: A. 
red_container, B. red_pantry, C. blue_treasure_chest, D. blue_pantry, E. blue_crate, F. blue_drawer, G. red_box, H. red_crate, I. green_envelope, J. green_pantry, K. green_bottle, L. red_envelope, M. green_drawer, N. blue_bathtub, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c397e302cac24e9268897ee55ea35f35316ee524 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. 
+13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: N. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7e8057630166c6147e2e0bd312e56ae34f8dbcd2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Avery really think the cherry is? +Answer: blue_suitcase +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: N. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d94cfcbc952e6f16e8b9fbb5fcc5f97385811cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Lily think Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. 
green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: F. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..306fdbc0cf82cbb4550e4ec94cc4ac637017d7f3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. 
+15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: H. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..52073f60dfde26b30c59d9b55dfaa46edc9dedfb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emily, Lily, Emma, Avery and Ella entered the pantry. +2 The cherry is in the red_drawer. +3 Emily moved the cherry to the red_container. +4 Emily exited the pantry. +5 Lily made no movements and stayed in the pantry for 1 minute. +6 Lily exited the pantry. +7 Emma moved the cherry to the green_envelope. +8 Emma exited the pantry. +9 Avery moved the cherry to the blue_suitcase. +10 Avery exited the pantry. +11 Ella made no movements and stayed in the pantry for 1 minute. +12 Ella exited the pantry. +13 Emily, Lily, Emma, Avery and Ella entered the waiting_room. +14 Lily, Avery and Ella entered the cellar. +15 The tomato is in the blue_container. +16 Lily made no movements and stayed in the cellar for 1 minute. +17 Lily exited the cellar. +18 Avery moved the tomato to the red_bucket. +19 Lily likes the red_drawer. +20 Avery exited the cellar. +21 Ella made no movements and stayed in the cellar for 1 minute. +22 Ella exited the cellar. +23 Lily, Avery and Ella entered the waiting_room. +Question: Where does Emily think Ella thinks Lily thinks Avery thinks the cherry is? +Answer: red_container +Choices: A. green_bucket, B. red_crate, C. green_bathtub, D. blue_treasure_chest, E. blue_pantry, F. red_container, G. red_drawer, H. blue_suitcase, I. green_envelope, J. green_treasure_chest, K. red_basket, L. blue_container, M. blue_crate, N. red_bucket, O. blue_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_container +GPT-4 Explain: F. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..274894c00bd02326dda451dde4b3693286590c7c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where is the pear really? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. 
red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..05c10907638693615847d3f34ee51eddeb1561ab --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. 
+15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Charlotte really think the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: E. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..969be9180870ac55e139d73fe7f2002ef6616b38 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Alexander think Charlotte thinks the pear is? +Answer: red_bucket +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: E. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fdcd922a51d97d80a94ba356d0699f1de9fc2286 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. +13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does Ava think Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. 
green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5fa797eeeeed740c002afb079c102330a4bebb46 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Ava, Charlotte, Avery and Alexander entered the pantry. +2 The pear is in the red_box. +3 William made no movements and stayed in the pantry for 1 minute. +4 William exited the pantry. +5 Ava made no movements and stayed in the pantry for 1 minute. +6 Ava exited the pantry. +7 Charlotte moved the pear to the red_bucket. +8 Charlotte exited the pantry. +9 Avery made no movements and stayed in the pantry for 1 minute. +10 Avery exited the pantry. +11 Alexander made no movements and stayed in the pantry for 1 minute. +12 Alexander exited the pantry. 
+13 William, Ava, Charlotte, Avery and Alexander entered the waiting_room. +14 Alexander, Charlotte and Ava entered the office. +15 The asparagus is in the red_basket. +16 Alexander moved the asparagus to the red_drawer. +17 Avery dislikes the pear. +18 Alexander exited the office. +19 Charlotte moved the asparagus to the red_pantry. +20 Charlotte exited the office. +21 Avery dislikes the cabbage. +22 Ava made no movements and stayed in the office for 1 minute. +23 Ava exited the office. +24 Alexander, Charlotte and Ava entered the waiting_room. +Question: Where does William think Ava thinks Alexander thinks Charlotte thinks the pear is? +Answer: red_box +Choices: A. red_drawer, B. red_basket, C. green_box, D. green_bottle, E. red_pantry, F. green_bathtub, G. red_bottle, H. red_container, I. red_crate, J. green_treasure_chest, K. green_bucket, L. red_box, M. red_bucket, N. blue_suitcase, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: M. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0aab48fa87ca5f2408abbd833ed6e5ab2181e766 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. 
blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d14c2ad699999577a151f53690197975dd99f076 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. 
+16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Carter really think the watermelon is? +Answer: green_basket +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: L. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ff77428a23eb9c9da411ad9aed51b157cf98795 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Avery think Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..446e993854f33b974565a464ceafb98726afcce8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. +12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Isla think Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. 
blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..db778f3dc0d693ea07089e100ed6e31bb43c8893 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Sophia, Carter, Emily and Isla entered the workshop. +2 The watermelon is in the blue_suitcase. +3 Avery made no movements and stayed in the workshop for 1 minute. +4 Avery exited the workshop. +5 Sophia moved the watermelon to the green_envelope. +6 Sophia exited the workshop. +7 Avery dislikes the tomato. +8 Carter moved the watermelon to the green_basket. +9 Carter exited the workshop. +10 Emily made no movements and stayed in the workshop for 1 minute. +11 Emily exited the workshop. 
+12 Isla made no movements and stayed in the workshop for 1 minute. +13 Isla exited the workshop. +14 Avery, Sophia, Carter, Emily and Isla entered the waiting_room. +15 Carter likes the green_treasure_chest. +16 Emily, Isla and Avery entered the sunroom. +17 The carrot is in the blue_treasure_chest. +18 Emily moved the carrot to the green_box. +19 Emily exited the sunroom. +20 Isla moved the carrot to the green_crate. +21 Isla exited the sunroom. +22 Avery made no movements and stayed in the sunroom for 1 minute. +23 Avery exited the sunroom. +24 Emily, Isla and Avery entered the waiting_room. +Question: Where does Sophia think Isla thinks Avery thinks Carter thinks the watermelon is? +Answer: blue_suitcase +Choices: A. green_envelope, B. blue_suitcase, C. red_envelope, D. green_basket, E. blue_bucket, F. green_cupboard, G. blue_treasure_chest, H. green_crate, I. red_drawer, J. green_box, K. green_drawer, L. green_treasure_chest, M. green_bathtub, N. blue_pantry, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: D. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..63985ae2923675918b6bd1d6e620dc808e1b3432 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where is the lemon really? +Answer: green_bottle +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2fccad3f4de738cfec383f854273099970561d89 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. 
+18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Isla really think the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc2ac5296b006c783fbb9971f12106f21e30e669 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. 
+4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Sophia think Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. 
green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..549fe8f9865be191ae49cef25481b9ccff18adbb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. +17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Evelyn think Sophia thinks Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. 
red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..41352c03e08da0cd390f950ec229615aab476e0c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isla, Alexander, Emma and Sophia entered the hall. +2 The lemon is in the red_box. +3 Evelyn moved the lemon to the red_container. +4 Evelyn exited the hall. +5 Isla made no movements and stayed in the hall for 1 minute. +6 Isla exited the hall. +7 Alexander moved the lemon to the green_treasure_chest. +8 Alexander exited the hall. +9 Emma moved the lemon to the green_bottle. +10 Emma exited the hall. +11 Sophia made no movements and stayed in the hall for 1 minute. +12 Sophia exited the hall. +13 Evelyn, Isla, Alexander, Emma and Sophia entered the waiting_room. +14 Alexander, Emma and Evelyn entered the TV_room. +15 The pear is in the red_basket. +16 Alexander made no movements and stayed in the TV_room for 1 minute. 
+17 Alexander exited the TV_room. +18 Emma moved the pear to the blue_treasure_chest. +19 Emma exited the TV_room. +20 Emma dislikes the eggplant. +21 Evelyn made no movements and stayed in the TV_room for 1 minute. +22 Evelyn exited the TV_room. +23 Alexander, Emma and Evelyn entered the waiting_room. +Question: Where does Alexander think Evelyn thinks Sophia thinks Isla thinks the lemon is? +Answer: red_container +Choices: A. red_basket, B. blue_treasure_chest, C. green_crate, D. blue_cupboard, E. red_bottle, F. blue_crate, G. green_pantry, H. green_bucket, I. green_box, J. blue_drawer, K. green_bottle, L. red_box, M. green_treasure_chest, N. blue_bathtub, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..99e307ae46a28bfae6250ad0bdac64c8daa01494 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. 
+2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where is the corn really? +Answer: green_bucket +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..553c06f5fca36e2789999a47693931e88d308993 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Abigail really think the corn is? +Answer: green_bucket +Choices: A. 
red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1b96f1c87b3ebdc038ef923d36418c8932518e6a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. 
+12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Nathan think Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: E. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..250876621bedb0f0bdc71fb12104024b929368d7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. +15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Avery think Nathan thinks Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. 
blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2555c9437dacb196450de1474f2ad9690ce15ee3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, William, Abigail, Nathan and Avery entered the basement. +2 The corn is in the red_basket. +3 Hannah moved the corn to the green_bathtub. +4 Hannah exited the basement. +5 Avery likes the green_crate. +6 William made no movements and stayed in the basement for 1 minute. +7 William exited the basement. +8 Abigail made no movements and stayed in the basement for 1 minute. +9 Abigail exited the basement. +10 Nathan made no movements and stayed in the basement for 1 minute. +11 Hannah dislikes the corn. +12 Nathan exited the basement. +13 Avery moved the corn to the red_basket. +14 Avery exited the basement. 
+15 Hannah, William, Abigail, Nathan and Avery entered the waiting_room. +16 Nathan lost his watch. +17 Hannah, Abigail and William entered the basement. +18 The corn is in the red_basket. +19 Hannah made no movements and stayed in the basement for 1 minute. +20 Hannah exited the basement. +21 Abigail moved the corn to the green_bucket. +22 Abigail exited the basement. +23 William made no movements and stayed in the basement for 1 minute. +24 William exited the basement. +25 Hannah, Abigail and William entered the waiting_room. +Question: Where does Hannah think Avery thinks Nathan thinks Abigail thinks the corn is? +Answer: green_bathtub +Choices: A. red_basket, B. red_bucket, C. green_bathtub, D. blue_suitcase, E. green_bucket, F. blue_bathtub, G. green_cupboard, H. red_pantry, I. red_bottle, J. blue_treasure_chest, K. green_box, L. green_envelope, M. green_crate, N. green_treasure_chest, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: E. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..48b55dd0e55a2285c1abe0cab2f5a2ae53cb9b72 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where is the tangerine really? +Answer: green_bottle +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. 
green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: J. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef2f70da63e000579e8c3b2e9a2fe0ab3046e307 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. 
+18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Benjamin really think the tangerine is? +Answer: red_bucket +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: J. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88bdd8a1f8a9e0ef964795366df0bf4f9fc0227d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. 
+3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Liam think Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: J. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d0ec8a019411e5139696090042d3af20fc77ffb2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. +17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Carter think Liam thinks Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. 
green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: I. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ee40fb0814075c452afe28ec9ddac9310c64e06 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Jackson, Carter, Benjamin and Sophia entered the den. +2 The tangerine is in the green_bottle. +3 Liam moved the tangerine to the blue_treasure_chest. +4 Sophia dislikes the banana. +5 Liam exited the den. +6 Jackson moved the tangerine to the green_bathtub. +7 Jackson exited the den. +8 Carter made no movements and stayed in the den for 1 minute. +9 Carter exited the den. +10 Benjamin moved the tangerine to the red_bucket. +11 Benjamin exited the den. +12 Sophia moved the tangerine to the green_bottle. +13 Sophia exited the den. +14 Liam, Jackson, Carter, Benjamin and Sophia entered the waiting_room. +15 Benjamin, Liam and Carter entered the bathroom. +16 The plum is in the blue_suitcase. 
+17 Benjamin moved the plum to the green_crate. +18 Benjamin exited the bathroom. +19 Liam moved the plum to the red_drawer. +20 Liam exited the bathroom. +21 Jackson dislikes the tangerine. +22 Carter made no movements and stayed in the bathroom for 1 minute. +23 Benjamin lost his phone. +24 Carter exited the bathroom. +25 Benjamin, Liam and Carter entered the waiting_room. +Question: Where does Jackson think Carter thinks Liam thinks Benjamin thinks the tangerine is? +Answer: blue_treasure_chest +Choices: A. red_pantry, B. blue_bottle, C. red_basket, D. green_box, E. red_bottle, F. blue_suitcase, G. blue_crate, H. green_bucket, I. green_crate, J. red_drawer, K. red_bucket, L. green_bottle, M. blue_treasure_chest, N. green_bathtub, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: I. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4768e014945c82dc87cee6e70b2840c5782aeb4c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where is the lime really? +Answer: green_pantry +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..28ce8f96ae745b2b629afaf4f07981d0d49129cb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Owen really think the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. 
green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ebcc08ca0b8076a708aac7be5d530802b014e8a6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. 
+13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Emily think Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_drawer +GPT-4 Explain: green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..69e0b3c922d74624043708b4d1195630492585aa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. +15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Lily think Emily thinks Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. 
red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..617c020364b8d7d6a688f103b3e762148c3d489c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Ella, Owen, Evelyn and Emily entered the front_yard. +2 Ella likes the red_bottle. +3 The lime is in the red_bottle. +4 Lily moved the lime to the blue_drawer. +5 Lily exited the front_yard. +6 Ella made no movements and stayed in the front_yard for 1 minute. +7 Ella exited the front_yard. +8 Owen made no movements and stayed in the front_yard for 1 minute. +9 Owen exited the front_yard. +10 Evelyn moved the lime to the green_pantry. +11 Evelyn dislikes the asparagus. +12 Evelyn exited the front_yard. +13 Emily made no movements and stayed in the front_yard for 1 minute. +14 Emily exited the front_yard. 
+15 Lily, Ella, Owen, Evelyn and Emily entered the waiting_room. +16 Lily, Emily and Ella entered the attic. +17 The lettuce is in the green_basket. +18 Owen likes the blue_drawer. +19 Lily made no movements and stayed in the attic for 1 minute. +20 Lily exited the attic. +21 Emily made no movements and stayed in the attic for 1 minute. +22 Lily lost his phone. +23 Emily exited the attic. +24 Ella moved the lettuce to the green_cupboard. +25 Ella exited the attic. +26 Lily, Emily and Ella entered the waiting_room. +Question: Where does Ella think Lily thinks Emily thinks Owen thinks the lime is? +Answer: blue_drawer +Choices: A. red_bottle, B. green_pantry, C. blue_drawer, D. green_bathtub, E. blue_container, F. blue_crate, G. red_drawer, H. blue_bathtub, I. red_envelope, J. red_basket, K. green_bucket, L. green_basket, M. red_bucket, N. green_bottle, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: B. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6a98aeed5bdbb68ffbebcc0013fdbbec4b9f2dd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where is the corn really? +Answer: blue_container +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. 
green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: M. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc021a17bf7b3dffbdcf43569bb2801cf239060b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. 
+16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Noah really think the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: M. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2807fd6652b9e37e0ef0552345f03ca2380897d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Lily think Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: K. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8cfda895ae9f995674f3f8b9e399b17556799e7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. +10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Isla think Lily thinks Noah thinks the corn is? 
+Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: I. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7fe3c8b873d6a8b293f7fdefa847080cd0d8482 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isla, Noah, Sophia and Lily entered the staircase. +2 The corn is in the blue_treasure_chest. +3 Mila made no movements and stayed in the staircase for 1 minute. +4 Mila exited the staircase. +5 Isla made no movements and stayed in the staircase for 1 minute. +6 Noah dislikes the green_pepper. +7 Isla exited the staircase. +8 Noah made no movements and stayed in the staircase for 1 minute. +9 Noah exited the staircase. 
+10 Sophia moved the corn to the blue_container. +11 Sophia exited the staircase. +12 Lily made no movements and stayed in the staircase for 1 minute. +13 Sophia dislikes the tomato. +14 Lily exited the staircase. +15 Mila, Isla, Noah, Sophia and Lily entered the waiting_room. +16 Isla, Sophia and Lily entered the front_yard. +17 The tomato is in the red_box. +18 Isla made no movements and stayed in the front_yard for 1 minute. +19 Isla exited the front_yard. +20 Sophia made no movements and stayed in the front_yard for 1 minute. +21 Sophia exited the front_yard. +22 Lily moved the tomato to the green_drawer. +23 Lily exited the front_yard. +24 Isla, Sophia and Lily entered the waiting_room. +Question: Where does Mila think Isla thinks Lily thinks Noah thinks the corn is? +Answer: blue_treasure_chest +Choices: A. green_pantry, B. red_envelope, C. green_bathtub, D. red_basket, E. blue_suitcase, F. red_box, G. blue_bottle, H. blue_drawer, I. green_drawer, J. red_container, K. blue_treasure_chest, L. red_bottle, M. blue_container, N. green_envelope, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: K. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..45de1a2f4c37c46cdac6aaeeab1dd06adbb96f37 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where is the tomato really? +Answer: blue_container +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. 
blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: J. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..30a05d133379f761471ff1a775eaf009d68c756d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. 
+16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Jackson really think the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e11fdd5711774caa38cf5fcca8582a9ae89d78f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. 
+2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Nathan think Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_crate +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..840f6849cef5e85bbf93cd4dccaa8ae7d1013b1f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. +15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Amelia think Nathan thinks Jackson thinks the tomato is? +Answer: blue_crate +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. 
blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: F. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..91a8e3df7b4ae357c2abc4412005cbf019566fca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Jackson, Amelia, Charlotte and Nathan entered the laundry. +2 The tomato is in the blue_container. +3 Sophia moved the tomato to the blue_cupboard. +4 Sophia exited the laundry. +5 Jackson moved the tomato to the blue_crate. +6 Jackson exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Charlotte made no movements and stayed in the laundry for 1 minute. +10 Charlotte exited the laundry. +11 Nathan moved the tomato to the blue_container. +12 Nathan exited the laundry. +13 Sophia, Jackson, Amelia, Charlotte and Nathan entered the waiting_room. +14 Nathan, Jackson and Amelia entered the hall. 
+15 The onion is in the blue_treasure_chest. +16 Nathan made no movements and stayed in the hall for 1 minute. +17 Nathan exited the hall. +18 Jackson moved the onion to the red_envelope. +19 Jackson exited the hall. +20 Amelia moved the onion to the green_cupboard. +21 Jackson saw a mouse. +22 Amelia exited the hall. +23 Jackson lost his phone. +24 Nathan, Jackson and Amelia entered the waiting_room. +Question: Where does Sophia think Amelia thinks Nathan thinks Jackson thinks the tomato is? +Answer: blue_cupboard +Choices: A. green_bottle, B. green_pantry, C. blue_suitcase, D. red_bucket, E. green_box, F. green_cupboard, G. blue_treasure_chest, H. red_bottle, I. green_drawer, J. red_envelope, K. blue_container, L. blue_crate, M. blue_cupboard, N. red_pantry, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: F. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..850d0f3759bbf5c495765d0931b0be7708c2b5f1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where is the corn really? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_basket +GPT-4 Explain: C. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..89811a42020ac08fd79eadfd1007473f2b482031 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Amelia really think the corn is? +Answer: red_basket +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: C. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c928352d3faa18dd46a5b5ed86b1d19a625e4b3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. 
+19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Lily think Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: C. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cff6c23072625377fe09ffd9048659028603bcc8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. 
+6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Sophia think Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: E. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0614dcc010baf537775e219e13bcc875d1d3c9ea --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Sophia, Lily, Carter and Amelia entered the hallway. +2 The corn is in the red_basket. +3 Liam moved the corn to the red_container. +4 Liam exited the hallway. +5 Sophia made no movements and stayed in the hallway for 1 minute. +6 Sophia exited the hallway. +7 Lily made no movements and stayed in the hallway for 1 minute. +8 Lily exited the hallway. +9 Carter made no movements and stayed in the hallway for 1 minute. +10 Carter exited the hallway. +11 Amelia moved the corn to the red_basket. +12 Amelia exited the hallway. +13 Liam, Sophia, Lily, Carter and Amelia entered the waiting_room. +14 Liam, Lily and Carter entered the hallway. +15 The melon is in the blue_bucket. +16 Liam moved the melon to the red_basket. +17 Liam exited the hallway. +18 Lily moved the melon to the green_pantry. +19 Lily exited the hallway. +20 Carter moved the melon to the red_container. +21 Carter exited the hallway. +22 Sophia dislikes the corn. +23 Liam, Lily and Carter entered the waiting_room. +Question: Where does Liam think Sophia thinks Lily thinks Amelia thinks the corn is? +Answer: red_container +Choices: A. blue_bucket, B. red_basket, C. red_container, D. blue_bathtub, E. green_pantry, F. red_envelope, G. blue_bottle, H. red_box, I. blue_cupboard, J. green_bathtub, K. red_drawer, L. red_bottle, M. blue_drawer, N. green_crate, O. green_treasure_chest + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ffa8f0523612554660accb081e9ae5355b4ff67e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. 
+19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where is the peas really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: D. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..26aee6a00340c37ee612737f48830cd986ca655c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. 
+5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Nathan really think the peas is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e8425dff020f073c92a3df1a7574d3bc5c7f2f34 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: N. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..969b7000ed075dbeb64e060776936c351fe6661c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. +4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. 
+18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Ella think Emily thinks Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: E. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ed06e2c0d266af449c264ef7eb81327b5ec5be9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn dislikes the potato. +2 Emily, Ella, Avery, Evelyn and Nathan entered the bathroom. +3 The peas is in the blue_suitcase. 
+4 Emily moved the peas to the red_basket. +5 Emily exited the bathroom. +6 Ella moved the peas to the red_envelope. +7 Ella exited the bathroom. +8 Avery moved the peas to the blue_cupboard. +9 Avery exited the bathroom. +10 Evelyn made no movements and stayed in the bathroom for 1 minute. +11 Evelyn exited the bathroom. +12 Nathan moved the peas to the blue_suitcase. +13 Nathan exited the bathroom. +14 Emily, Ella, Avery, Evelyn and Nathan entered the waiting_room. +15 Evelyn, Avery and Nathan entered the kitchen. +16 The corn is in the red_box. +17 Evelyn made no movements and stayed in the kitchen for 1 minute. +18 Evelyn exited the kitchen. +19 Avery made no movements and stayed in the kitchen for 1 minute. +20 Avery exited the kitchen. +21 Nathan made no movements and stayed in the kitchen for 1 minute. +22 Nathan exited the kitchen. +23 Evelyn, Avery and Nathan entered the waiting_room. +Question: Where does Evelyn think Ella thinks Emily thinks Nathan thinks the peas is? +Answer: red_basket +Choices: A. blue_suitcase, B. green_envelope, C. blue_cupboard, D. red_basket, E. red_envelope, F. red_box, G. blue_bathtub, H. green_basket, I. red_crate, J. blue_container, K. blue_bucket, L. green_bottle, M. blue_treasure_chest, N. red_bucket, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: E. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b832736fe2b9a1d274026161328392608568a192 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where is the peas really? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: N. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4aa5589a2ddb3137430cb0334a043367f247ffca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. 
+20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Benjamin really think the peas is? +Answer: blue_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a9da27d7da11832d9010a1731a52beaf9815f25 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. 
+6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks the peas is? +Answer: green_crate +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: M. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..117cbd2f1e8d30dcee08e5261b950a6e4a1ddb30 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. +20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Liam think Noah thinks Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c17acce60f4ec1dbfdd3d171724b80339e0023cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Noah, Avery, Mila and Benjamin entered the workshop. +2 The peas is in the green_drawer. +3 Liam moved the peas to the blue_container. +4 Liam dislikes the peas. +5 Liam exited the workshop. +6 Noah moved the peas to the green_crate. +7 Noah exited the workshop. +8 Avery moved the peas to the blue_bucket. +9 Avery exited the workshop. +10 Mila moved the peas to the blue_crate. +11 Liam saw a dog. +12 Mila exited the workshop. +13 Benjamin made no movements and stayed in the workshop for 1 minute. +14 Benjamin exited the workshop. +15 Liam, Noah, Avery, Mila and Benjamin entered the waiting_room. +16 Noah, Liam and Mila entered the den. +17 The melon is in the red_bucket. +18 Noah made no movements and stayed in the den for 1 minute. +19 Noah exited the den. 
+20 Liam made no movements and stayed in the den for 1 minute. +21 Liam exited the den. +22 Mila moved the melon to the blue_suitcase. +23 Mila exited the den. +24 Noah, Liam and Mila entered the waiting_room. +Question: Where does Avery think Liam thinks Noah thinks Benjamin thinks the peas is? +Answer: blue_container +Choices: A. red_bucket, B. blue_bathtub, C. blue_suitcase, D. blue_cupboard, E. green_basket, F. green_pantry, G. red_basket, H. red_envelope, I. green_treasure_chest, J. green_envelope, K. green_drawer, L. blue_container, M. blue_crate, N. blue_bucket, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3167d4cf18f64f77053ee0c85fb1b9a783772216 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. 
+4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where is the potato really? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: J. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d9ec1e8ad7fb8c9b006c6337a395f0e4813261f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Isabella really think the potato is? +Answer: green_bottle +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d638a3d1e03a51d449c2e20c74eb8df0ff5d315b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. 
+18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Chloe think Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: D. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfd0ff600b0aeb2c2d437867c26b50c846450d3d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. 
+5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Evelyn think Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: C. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b25a5b7fee0d86ece1cef8f20fcf42de832df65 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Mila, Isabella and Jacob entered the crawlspace. +2 The potato is in the blue_drawer. +3 Evelyn made no movements and stayed in the crawlspace for 1 minute. +4 Evelyn exited the crawlspace. +5 Chloe made no movements and stayed in the crawlspace for 1 minute. +6 Chloe exited the crawlspace. +7 Mila moved the potato to the red_basket. +8 Mila exited the crawlspace. +9 Isabella moved the potato to the green_bottle. +10 Isabella exited the crawlspace. +11 Jacob moved the potato to the blue_drawer. +12 Jacob exited the crawlspace. +13 Evelyn, Chloe, Mila, Isabella and Jacob entered the waiting_room. +14 Evelyn, Mila and Jacob entered the closet. +15 The watermelon is in the green_crate. +16 Evelyn moved the watermelon to the blue_suitcase. +17 Evelyn exited the closet. +18 Mila moved the watermelon to the red_drawer. +19 Mila exited the closet. +20 Jacob made no movements and stayed in the closet for 1 minute. +21 Jacob exited the closet. +22 Evelyn, Mila and Jacob entered the waiting_room. +Question: Where does Jacob think Evelyn thinks Chloe thinks Isabella thinks the potato is? +Answer: blue_drawer +Choices: A. blue_treasure_chest, B. blue_drawer, C. green_bottle, D. red_basket, E. red_box, F. red_drawer, G. green_crate, H. green_treasure_chest, I. green_box, J. blue_suitcase, K. blue_crate, L. green_basket, M. blue_bathtub, N. red_crate, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5dc3d326a4979ab1ceee82df689ef2d48fc6607e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. 
+16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where is the cabbage really? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: C. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..14fd989915d92eeaae3690e7775f1bbc06b0e0dc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cabbage is? +Answer: green_envelope +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f2f33c1240a3e4ac91af5044bcae6017ad083fd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Aiden think Avery thinks the cabbage is? +Answer: green_box +Choices: A. 
red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5986c6df51f059d6f870378f8e77bcb6c9f0f8fa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. 
+12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Emma think Aiden thinks Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: B. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f43b8386b817dc35911727dd5799781accf9639 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Emma, Avery, Aiden and Jackson entered the staircase. +2 The cabbage is in the green_envelope. +3 Noah moved the cabbage to the green_box. +4 Emma likes the red_envelope. +5 Noah exited the staircase. +6 Emma made no movements and stayed in the staircase for 1 minute. +7 Emma exited the staircase. +8 Avery made no movements and stayed in the staircase for 1 minute. +9 Avery exited the staircase. +10 Aiden made no movements and stayed in the staircase for 1 minute. +11 Aiden exited the staircase. +12 Jackson made no movements and stayed in the staircase for 1 minute. +13 Jackson exited the staircase. +14 Noah, Emma, Avery, Aiden and Jackson entered the waiting_room. +15 Aiden likes the blue_bucket. +16 Aiden, Avery and Jackson entered the staircase. +17 The cabbage is in the green_box. +18 Aiden made no movements and stayed in the staircase for 1 minute. +19 Aiden exited the staircase. +20 Avery moved the cabbage to the green_envelope. +21 Avery exited the staircase. +22 Jackson made no movements and stayed in the staircase for 1 minute. +23 Jackson exited the staircase. +24 Aiden, Avery and Jackson entered the waiting_room. +Question: Where does Noah think Emma thinks Aiden thinks Avery thinks the cabbage is? +Answer: green_box +Choices: A. red_envelope, B. green_envelope, C. green_box, D. blue_bucket, E. blue_pantry, F. green_basket, G. blue_drawer, H. red_container, I. green_bucket, J. 
green_bathtub, K. red_box, L. green_crate, M. blue_container, N. green_drawer, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ded090b4ab9c1cc8cf0a3a51a979cd1a99823f89 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. 
+17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where is the melon really? +Answer: red_pantry +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: C. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c6e22735d64bdf4ebc4621ff4ba45b111dc0ecf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. 
+2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Owen really think the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: G. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a264fdcedf37b6b943ad95bda901fb59f4aa22a1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Avery think Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. 
green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: G. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d43fcf6faafefc64eb0546b098b21adda6db86bc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. +2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. 
+18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Benjamin think Avery thinks Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: G \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1962c83ccbb79af72feda4041b84ef715b734baf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Avery, Benjamin, Mila and Noah entered the bedroom. 
+2 The melon is in the red_pantry. +3 Owen moved the melon to the green_basket. +4 Owen exited the bedroom. +5 Avery saw a monkey. +6 Avery made no movements and stayed in the bedroom for 1 minute. +7 Avery exited the bedroom. +8 Owen likes the red_basket. +9 Benjamin made no movements and stayed in the bedroom for 1 minute. +10 Benjamin exited the bedroom. +11 Mila moved the melon to the green_box. +12 Mila exited the bedroom. +13 Noah moved the melon to the red_pantry. +14 Noah exited the bedroom. +15 Owen, Avery, Benjamin, Mila and Noah entered the waiting_room. +16 Noah, Avery and Mila entered the dining_room. +17 The sweet_potato is in the red_basket. +18 Noah moved the sweet_potato to the green_bucket. +19 Noah exited the dining_room. +20 Avery moved the sweet_potato to the blue_container. +21 Avery exited the dining_room. +22 Owen saw a dog. +23 Mila made no movements and stayed in the dining_room for 1 minute. +24 Mila exited the dining_room. +25 Noah, Avery and Mila entered the waiting_room. +Question: Where does Noah think Benjamin thinks Avery thinks Owen thinks the melon is? +Answer: green_basket +Choices: A. red_basket, B. green_crate, C. green_bucket, D. blue_container, E. red_crate, F. red_pantry, G. green_basket, H. green_pantry, I. blue_bucket, J. green_box, K. red_drawer, L. red_box, M. blue_cupboard, N. green_envelope, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_basket +GPT-4 Explain: C. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bd210b98c158fb246c3822b0f260ae6666825ed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. 
blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: J. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..81f46015b0acd7ed9b07c95057875151da287747 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. 
+15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Nathan really think the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: J. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f1c7ac8f8342abb20aa870ab56a64f93d9303917 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Lily think Nathan thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. 
red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: J. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..097cec03480aaf8f9557d5b47840b8ac300905ee --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. 
+16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Isabella think Lily thinks Nathan thinks the melon is? +Answer: green_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9abf05e4f1cdd26f4db928f63b2bdcf7eb94fab4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Evelyn, Isabella, Nathan, Ava and Lily entered the hallway. +2 The melon is in the blue_container. +3 Evelyn moved the melon to the green_treasure_chest. +4 Evelyn exited the hallway. +5 Lily dislikes the cucumber. +6 Isabella made no movements and stayed in the hallway for 1 minute. +7 Isabella exited the hallway. +8 Nathan moved the melon to the blue_treasure_chest. +9 Nathan exited the hallway. +10 Ava made no movements and stayed in the hallway for 1 minute. +11 Ava exited the hallway. +12 Lily made no movements and stayed in the hallway for 1 minute. +13 Ava dislikes the spinach. +14 Lily exited the hallway. +15 Evelyn, Isabella, Nathan, Ava and Lily entered the waiting_room. +16 Nathan, Isabella and Evelyn entered the cellar. +17 The spinach is in the red_crate. +18 Nathan moved the spinach to the blue_bottle. +19 Nathan exited the cellar. +20 Isabella moved the spinach to the red_bottle. +21 Isabella exited the cellar. +22 Nathan lost his phone. +23 Evelyn made no movements and stayed in the cellar for 1 minute. +24 Evelyn exited the cellar. +25 Nathan, Isabella and Evelyn entered the waiting_room. +Question: Where does Ava think Isabella thinks Lily thinks Nathan thinks the melon is? +Answer: green_treasure_chest +Choices: A. blue_pantry, B. green_bottle, C. red_envelope, D. green_cupboard, E. green_crate, F. green_box, G. red_crate, H. red_bottle, I. blue_cupboard, J. blue_bottle, K. blue_container, L. blue_bathtub, M. red_bucket, N. blue_treasure_chest, O. green_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b90659e754370a8d27eeac69c041585e7c7113a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where is the watermelon really? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. 
blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..06e939b48a8e7cf721bcd99eea40d774f111ce98 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. 
+12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Noah really think the watermelon is? +Answer: blue_treasure_chest +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: Noah really thinks the watermelon is in the green_bucket. + +Answer: A. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b7bf82299d2604750c6696f73344c2f8e989db53 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Emma think Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..adb06574adc516adf81d726c5bc848a00b962fa3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. +4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. 
+19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Liam think Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..77c94e624e947109b07fedf4bfdebf434041d169 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Abigail, Owen, Emma and Liam entered the hall. +2 The watermelon is in the green_bucket. +3 Noah made no movements and stayed in the hall for 1 minute. 
+4 Noah exited the hall. +5 Abigail made no movements and stayed in the hall for 1 minute. +6 Abigail exited the hall. +7 Owen made no movements and stayed in the hall for 1 minute. +8 Emma dislikes the melon. +9 Owen exited the hall. +10 Emma moved the watermelon to the blue_treasure_chest. +11 Emma exited the hall. +12 Liam made no movements and stayed in the hall for 1 minute. +13 Liam exited the hall. +14 Noah, Abigail, Owen, Emma and Liam entered the waiting_room. +15 Noah, Owen and Liam entered the hall. +16 The persimmon is in the blue_bathtub. +17 Noah made no movements and stayed in the hall for 1 minute. +18 Liam saw a dog. +19 Noah exited the hall. +20 Owen moved the persimmon to the green_crate. +21 Owen exited the hall. +22 Liam moved the persimmon to the green_bathtub. +23 Liam exited the hall. +24 Noah, Owen and Liam entered the waiting_room. +Question: Where does Owen think Liam thinks Emma thinks Noah thinks the watermelon is? +Answer: green_bucket +Choices: A. green_bucket, B. blue_bathtub, C. green_crate, D. green_bathtub, E. blue_treasure_chest, F. green_basket, G. green_drawer, H. red_bucket, I. blue_drawer, J. blue_pantry, K. blue_suitcase, L. blue_bucket, M. red_crate, N. blue_bottle, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: D. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bea19b2198083c17f84d3c0bfec180c173d4dd6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: D. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8d327f7493660dfc73d9c743cb2c34db2cebc40 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. 
+21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Noah really think the carrot is? +Answer: red_basket +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd81d12c715fe24e2de35c04113000981e6c09a6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. 
+2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Owen think Noah thinks the carrot is? +Answer: green_drawer +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: J. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4200bb49b877acebeb5d6d1898c1a910a49885cb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. +16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Mila think Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. 
red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: L. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7297ba58baf1e3693a752ddde786c875a74ce --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Mila, Owen, Lily and Noah entered the hall. +2 The carrot is in the red_basket. +3 Evelyn moved the carrot to the red_pantry. +4 Evelyn exited the hall. +5 Mila made no movements and stayed in the hall for 1 minute. +6 Mila exited the hall. +7 Owen moved the carrot to the green_drawer. +8 Mila saw a cat. +9 Owen exited the hall. +10 Lily moved the carrot to the red_envelope. +11 Lily exited the hall. +12 Noah moved the carrot to the red_basket. +13 Owen lost his watch. +14 Noah exited the hall. +15 Owen likes the red_basket. 
+16 Evelyn, Mila, Owen, Lily and Noah entered the waiting_room. +17 Owen dislikes the spinach. +18 Noah, Mila and Owen entered the sunroom. +19 The cherry is in the blue_crate. +20 Mila dislikes the spinach. +21 Noah made no movements and stayed in the sunroom for 1 minute. +22 Owen likes the green_treasure_chest. +23 Noah exited the sunroom. +24 Mila moved the cherry to the green_bucket. +25 Mila exited the sunroom. +26 Owen made no movements and stayed in the sunroom for 1 minute. +27 Owen exited the sunroom. +28 Noah, Mila and Owen entered the waiting_room. +Question: Where does Lily think Mila thinks Owen thinks Noah thinks the carrot is? +Answer: red_pantry +Choices: A. red_basket, B. green_drawer, C. red_pantry, D. red_envelope, E. blue_drawer, F. green_cupboard, G. green_bathtub, H. red_box, I. red_drawer, J. green_treasure_chest, K. blue_crate, L. green_basket, M. blue_bathtub, N. green_bottle, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: D. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d437c919f204cb283f89272db2502933fcce7b3a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. 
+31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where is the lettuce really? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: J. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ed2ec942ccdb1ffaf5da3964d3b899f5b7197cb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. 
+4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Isabella really think the lettuce is? +Answer: blue_container +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c7faf06448064a4302e6b01cd4996bd32b975f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. 
+20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Abigail think Isabella thinks the lettuce is? +Answer: red_basket +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: K. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4115a33d19f291fc807c9cdfe4448501709d8145 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. +3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. 
+31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Nathan think Abigail thinks Isabella thinks the lettuce is? +Answer: green_cupboard +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: J. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b953746d3e2eb4e7146722e697f5be59d54529fc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Logan, Jackson, Abigail and Isabella entered the back_yard. +2 The lettuce is in the blue_container. 
+3 Nathan moved the lettuce to the green_cupboard. +4 Nathan exited the back_yard. +5 Logan moved the lettuce to the blue_treasure_chest. +6 Logan exited the back_yard. +7 Jackson made no movements and stayed in the back_yard for 1 minute. +8 Jackson exited the back_yard. +9 Abigail moved the lettuce to the red_basket. +10 Abigail exited the back_yard. +11 Isabella moved the lettuce to the blue_container. +12 Logan dislikes the corn. +13 Isabella exited the back_yard. +14 Nathan, Logan, Jackson, Abigail and Isabella entered the waiting_room. +15 Jackson, Nathan and Logan entered the playroom. +16 The melon is in the green_box. +17 Jackson made no movements and stayed in the playroom for 1 minute. +18 Nathan dislikes the lettuce. +19 Jackson exited the playroom. +20 Nathan made no movements and stayed in the playroom for 1 minute. +21 Nathan exited the playroom. +22 Logan moved the melon to the red_crate. +23 Logan exited the playroom. +24 Jackson, Nathan and Logan entered the waiting_room. +25 Isabella, Jackson, Abigail and Nathan entered the hallway. +26 The tangerine is in the blue_bottle. +27 Isabella moved the tangerine to the red_box. +28 Isabella exited the hallway. +29 Jackson made no movements and stayed in the hallway for 1 minute. +30 Jackson exited the hallway. +31 Abigail moved the tangerine to the blue_bathtub. +32 Abigail exited the hallway. +33 Logan dislikes the lettuce. +34 Nathan moved the tangerine to the red_container. +35 Nathan exited the hallway. +36 Isabella, Jackson, Abigail and Nathan entered the waiting_room. +Question: Where does Logan think Nathan thinks Abigail thinks Isabella thinks the lettuce is? +Answer: green_cupboard +Choices: A. red_crate, B. green_box, C. green_bathtub, D. red_drawer, E. blue_cupboard, F. blue_bottle, G. blue_bathtub, H. red_box, I. blue_crate, J. red_container, K. blue_container, L. red_basket, M. red_bucket, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: J. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c845d2f419c069dbb25058c69ea52cfe026829bb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. 
+18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: O. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ebccb44d908fd7cacd45b76b4a02100b45fd9f5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. 
+32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Evelyn really think the sweet_potato is? +Answer: blue_cupboard +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..13f6c535f20a1c9cf6b085b576e7ab973cb0e983 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. 
+5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Logan think Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: J. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5358756293584f41002351016c6ffb94af8e7e4a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. 
+19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. +32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does Charlotte think Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: J. 
green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2ec2e68e21186677ce170c389fd943ff4029983 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Ava, Evelyn, Charlotte and William entered the kitchen. +2 The sweet_potato is in the red_container. +3 Ava saw a mouse. +4 Logan made no movements and stayed in the kitchen for 1 minute. +5 Logan exited the kitchen. +6 Ava moved the sweet_potato to the blue_cupboard. +7 Ava exited the kitchen. +8 Evelyn made no movements and stayed in the kitchen for 1 minute. +9 Evelyn exited the kitchen. +10 Charlotte moved the sweet_potato to the green_drawer. +11 Charlotte exited the kitchen. +12 William moved the sweet_potato to the red_container. +13 William exited the kitchen. +14 Logan, Ava, Evelyn, Charlotte and William entered the waiting_room. +15 Ava, Logan and Evelyn entered the hallway. +16 The peas is in the red_basket. +17 Ava made no movements and stayed in the hallway for 1 minute. +18 Ava exited the hallway. +19 Logan made no movements and stayed in the hallway for 1 minute. +20 Logan exited the hallway. +21 Evelyn moved the peas to the green_bathtub. +22 Evelyn exited the hallway. +23 Ava, Logan and Evelyn entered the waiting_room. +24 Logan lost his phone. +25 William, Logan, Evelyn and Charlotte entered the bedroom. +26 Charlotte likes the green_bathtub. +27 The banana is in the green_cupboard. +28 William moved the banana to the green_bottle. +29 William exited the bedroom. +30 Logan moved the banana to the green_envelope. +31 Logan exited the bedroom. 
+32 Evelyn moved the banana to the red_crate. +33 Evelyn exited the bedroom. +34 Charlotte moved the banana to the green_pantry. +35 Charlotte exited the bedroom. +36 William, Logan, Evelyn and Charlotte entered the waiting_room. +Question: Where does William think Charlotte thinks Logan thinks Evelyn thinks the sweet_potato is? +Answer: red_container +Choices: A. blue_pantry, B. red_basket, C. green_bathtub, D. blue_drawer, E. blue_bottle, F. red_container, G. blue_cupboard, H. green_basket, I. green_box, J. green_drawer, K. green_cupboard, L. green_pantry, M. green_envelope, N. green_bottle, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: K. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9d59cdc48bfe2d8e55737121df35461d02a6660 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. 
+3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where is the melon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: I. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..796dc58f3d45fb5431dfa780a6da063d35687a6f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. 
+21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does William really think the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: D. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a36375fe263be31cfcda4daba855f9536c586dda --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. 
+32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Lily think William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: C. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d108f8afff243f2359ee233daa6917c998df34e2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. 
+4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. +21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Emma think Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: M. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bdae8f7022bef5634fca73a13aaa1f65206d3ed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Lily, Aiden, Emma and Isla entered the porch. +2 The melon is in the green_bathtub. +3 William made no movements and stayed in the porch for 1 minute. +4 William exited the porch. +5 Lily made no movements and stayed in the porch for 1 minute. +6 Lily exited the porch. +7 Aiden moved the melon to the blue_pantry. +8 Lily likes the green_bucket. +9 Aiden exited the porch. +10 Emma moved the melon to the green_bucket. +11 Emma exited the porch. +12 Isla moved the melon to the green_bathtub. +13 Isla exited the porch. +14 William, Lily, Aiden, Emma and Isla entered the waiting_room. +15 Emma, Isla and Aiden entered the basement. +16 The watermelon is in the blue_suitcase. +17 Emma made no movements and stayed in the basement for 1 minute. +18 Emma exited the basement. +19 Isla moved the watermelon to the blue_bottle. +20 Isla exited the basement. 
+21 Aiden made no movements and stayed in the basement for 1 minute. +22 Aiden exited the basement. +23 Emma, Isla and Aiden entered the waiting_room. +24 Aiden likes the red_pantry. +25 William, Isla, Aiden and Lily entered the front_yard. +26 The beans is in the red_bottle. +27 William made no movements and stayed in the front_yard for 1 minute. +28 Isla likes the green_cupboard. +29 William exited the front_yard. +30 Isla moved the beans to the green_bottle. +31 Isla exited the front_yard. +32 Aiden made no movements and stayed in the front_yard for 1 minute. +33 Aiden exited the front_yard. +34 Lily made no movements and stayed in the front_yard for 1 minute. +35 Lily exited the front_yard. +36 William, Isla, Aiden and Lily entered the waiting_room. +Question: Where does Isla think Emma thinks Lily thinks William thinks the melon is? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_cupboard, C. green_bucket, D. blue_pantry, E. green_basket, F. blue_suitcase, G. green_box, H. red_pantry, I. blue_bottle, J. red_container, K. blue_bathtub, L. red_bottle, M. green_bottle, N. red_bucket, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: I. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc638d9a9e8684c57e856702b05b63b3d091fd29 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. 
+31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where is the beans really? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5af401dea54769edb24b8ba45370e543bfb5e2be --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. 
+6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Jack really think the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: E. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4fe0b08508f28e17dae2e80d91580bbcecad3fa1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. 
+22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Owen think Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: E. 
green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7aaf70f2ca04c2631449199689e16819c6773b0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. +5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. 
+31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Liam think Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: E. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0621d3aeee97168c8ed397cac62e7e5c76f22fdd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Liam, Jack, Jackson and Benjamin entered the hall. +2 The beans is in the blue_suitcase. +3 Owen made no movements and stayed in the hall for 1 minute. +4 Owen exited the hall. 
+5 Liam made no movements and stayed in the hall for 1 minute. +6 Liam exited the hall. +7 Jack moved the beans to the green_treasure_chest. +8 Jack exited the hall. +9 Jackson made no movements and stayed in the hall for 1 minute. +10 Jackson exited the hall. +11 Benjamin moved the beans to the blue_suitcase. +12 Benjamin exited the hall. +13 Owen, Liam, Jack, Jackson and Benjamin entered the waiting_room. +14 Owen, Jack and Jackson entered the workshop. +15 The cherry is in the red_basket. +16 Owen made no movements and stayed in the workshop for 1 minute. +17 Owen exited the workshop. +18 Jack made no movements and stayed in the workshop for 1 minute. +19 Jack exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Owen, Jack and Jackson entered the waiting_room. +23 Owen, Jack, Benjamin and Jackson entered the hall. +24 The beans is in the blue_suitcase. +25 Owen made no movements and stayed in the hall for 1 minute. +26 Owen likes the blue_bathtub. +27 Owen exited the hall. +28 Jack made no movements and stayed in the hall for 1 minute. +29 Jack exited the hall. +30 Benjamin made no movements and stayed in the hall for 1 minute. +31 Benjamin exited the hall. +32 Jackson made no movements and stayed in the hall for 1 minute. +33 Jackson exited the hall. +34 Owen, Jack, Benjamin and Jackson entered the waiting_room. +Question: Where does Benjamin think Liam thinks Owen thinks Jack thinks the beans is? +Answer: blue_suitcase +Choices: A. blue_suitcase, B. green_bathtub, C. blue_bathtub, D. green_envelope, E. green_treasure_chest, F. red_basket, G. blue_bottle, H. blue_cupboard, I. blue_bucket, J. green_bottle, K. red_box, L. red_container, M. green_pantry, N. green_cupboard, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: E. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d881ec77aed9ab65fd4d3bd5c12052d38a14195a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. 
+21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: N. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b462ade3f4b95191194f9e5ee0f0c728490561b6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. 
+34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does William really think the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..944312785b96d31eaeec49c07f685f4e43a52801 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. 
+7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emily think William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f005d745deb9a36b70f1fc2a12002c9169eab877 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. 
+24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. +34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Emma think Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: N. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ec53e74005ab02c3a2b0cdc8070db89f479b933 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Emily, Emma, Isla and Jackson entered the pantry. +2 The corn is in the green_bathtub. +3 William moved the corn to the green_cupboard. +4 Emma likes the blue_crate. +5 William exited the pantry. +6 William dislikes the corn. +7 Emily moved the corn to the red_envelope. +8 Emily exited the pantry. +9 Emma made no movements and stayed in the pantry for 1 minute. +10 Emma exited the pantry. +11 Isla moved the corn to the green_bottle. +12 Isla exited the pantry. +13 Jackson moved the corn to the green_bathtub. +14 Jackson exited the pantry. +15 William, Emily, Emma, Isla and Jackson entered the waiting_room. +16 William, Emily and Isla entered the crawlspace. +17 The asparagus is in the green_bucket. +18 William moved the asparagus to the green_drawer. +19 William lost his watch. +20 William exited the crawlspace. +21 Emily made no movements and stayed in the crawlspace for 1 minute. +22 Emily exited the crawlspace. +23 Isla made no movements and stayed in the crawlspace for 1 minute. +24 Isla exited the crawlspace. +25 William, Emily and Isla entered the waiting_room. +26 William, Isla, Emily and Emma entered the pantry. +27 The corn is in the green_bathtub. +28 William made no movements and stayed in the pantry for 1 minute. +29 William exited the pantry. +30 Isla moved the corn to the green_cupboard. +31 Isla exited the pantry. +32 Emily moved the corn to the blue_crate. +33 Emily saw a mouse. 
+34 Emily exited the pantry. +35 Emma moved the corn to the green_bottle. +36 Emma exited the pantry. +37 William, Isla, Emily and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks Emily thinks William thinks the corn is? +Answer: green_bathtub +Choices: A. blue_bottle, B. red_drawer, C. red_bottle, D. blue_container, E. red_bucket, F. green_bucket, G. red_pantry, H. green_drawer, I. blue_treasure_chest, J. green_envelope, K. green_bathtub, L. red_envelope, M. green_cupboard, N. green_bottle, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1886b3a90144ccda8ab7df66c8813ed56b4cecd0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. 
+5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where is the cucumber really? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c158d699cf4ad08f3107207f567e1b88325474ff --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. 
+20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Avery really think the cucumber is? +Answer: red_pantry +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: M. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..abb0db7df4ebbb6685f0e7d69e4771ca6bfd509d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. 
+32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Abigail think Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: K. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c5bb70e234c174d89054863651d6046d7f802f9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. 
+3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. +18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Hannah think Abigail thinks Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: K. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..932e382169a6439a4b3db03dbb0f6dcff966d82b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Jackson, Hannah, Owen and Avery entered the basement. +2 The cucumber is in the blue_drawer. +3 Abigail moved the cucumber to the blue_container. +4 Abigail exited the basement. +5 Jackson made no movements and stayed in the basement for 1 minute. +6 Jackson exited the basement. +7 Abigail lost his phone. +8 Hannah moved the cucumber to the blue_bathtub. +9 Avery dislikes the plum. +10 Hannah exited the basement. +11 Owen moved the cucumber to the red_pantry. +12 Owen exited the basement. +13 Avery made no movements and stayed in the basement for 1 minute. +14 Avery exited the basement. +15 Abigail, Jackson, Hannah, Owen and Avery entered the waiting_room. +16 Jackson, Abigail and Hannah entered the basement. +17 The carrot is in the blue_bathtub. 
+18 Jackson moved the carrot to the green_basket. +19 Jackson exited the basement. +20 Abigail made no movements and stayed in the basement for 1 minute. +21 Abigail exited the basement. +22 Hannah moved the carrot to the blue_container. +23 Hannah exited the basement. +24 Jackson, Abigail and Hannah entered the waiting_room. +25 Owen, Hannah, Avery and Jackson entered the basement. +26 The carrot is in the blue_container. +27 Owen moved the carrot to the red_pantry. +28 Owen saw a cat. +29 Owen exited the basement. +30 Hannah moved the carrot to the blue_bathtub. +31 Hannah exited the basement. +32 Avery made no movements and stayed in the basement for 1 minute. +33 Avery exited the basement. +34 Jackson made no movements and stayed in the basement for 1 minute. +35 Owen lost his watch. +36 Jackson exited the basement. +37 Owen, Hannah, Avery and Jackson entered the waiting_room. +Question: Where does Owen think Hannah thinks Abigail thinks Avery thinks the cucumber is? +Answer: blue_container +Choices: A. blue_bottle, B. green_box, C. green_cupboard, D. green_bucket, E. red_box, F. green_bottle, G. red_envelope, H. blue_bucket, I. red_crate, J. blue_pantry, K. blue_bathtub, L. blue_drawer, M. red_pantry, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: M. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b3952b227401cfa94dcf91dc405ed9c39b6e79d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where is the sweet_potato really? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1344c190da7a36338c89066f15a39721310c5425 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. 
+3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Jacob really think the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: B. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8ef410bb2a5a5acc7e4b4701cfcb558ee5e15465 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. 
+16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Aiden think Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae927c921ffbdcebeefd679ec67a87a2352e2041 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. +3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. 
+30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Mila think Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fbbbef5a2f79a12657538f634c17899dd8111513 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jacob, Mila, Elizabeth, Aiden and Amelia entered the master_bedroom. +2 The sweet_potato is in the green_bottle. 
+3 Jacob made no movements and stayed in the master_bedroom for 1 minute. +4 Jacob exited the master_bedroom. +5 Mila made no movements and stayed in the master_bedroom for 1 minute. +6 Mila exited the master_bedroom. +7 Elizabeth made no movements and stayed in the master_bedroom for 1 minute. +8 Elizabeth exited the master_bedroom. +9 Aiden moved the sweet_potato to the blue_bucket. +10 Aiden exited the master_bedroom. +11 Amelia moved the sweet_potato to the green_bottle. +12 Amelia exited the master_bedroom. +13 Jacob, Mila, Elizabeth, Aiden and Amelia entered the waiting_room. +14 Amelia, Mila and Elizabeth entered the crawlspace. +15 The carrot is in the red_pantry. +16 Amelia made no movements and stayed in the crawlspace for 1 minute. +17 Amelia exited the crawlspace. +18 Mila moved the carrot to the green_treasure_chest. +19 Mila exited the crawlspace. +20 Amelia lost his watch. +21 Elizabeth moved the carrot to the blue_pantry. +22 Elizabeth exited the crawlspace. +23 Amelia likes the blue_pantry. +24 Amelia, Mila and Elizabeth entered the waiting_room. +25 Amelia, Jacob, Aiden and Mila entered the office. +26 The peach is in the green_bathtub. +27 Amelia moved the peach to the green_bucket. +28 Amelia exited the office. +29 Jacob moved the peach to the green_drawer. +30 Jacob exited the office. +31 Aiden made no movements and stayed in the office for 1 minute. +32 Aiden exited the office. +33 Mila made no movements and stayed in the office for 1 minute. +34 Mila exited the office. +35 Amelia, Jacob, Aiden and Mila entered the waiting_room. +Question: Where does Elizabeth think Mila thinks Aiden thinks Jacob thinks the sweet_potato is? +Answer: green_bottle +Choices: A. green_crate, B. green_bottle, C. blue_bucket, D. red_drawer, E. blue_container, F. blue_pantry, G. red_pantry, H. green_treasure_chest, I. red_bucket, J. blue_treasure_chest, K. blue_crate, L. green_bathtub, M. blue_cupboard, N. green_bucket, O. 
green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: F. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b83ae9caf2af7b1878cea05d48c0f937bd5e1a18 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. 
+16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where is the persimmon really? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: N. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e80b88b3b9feecce761affedcb6c54bd7069624e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. 
+31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does William really think the persimmon is? +Answer: red_basket +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fff19e4e0666b2015063f3794a8e8bd901508ad1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. 
+7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Hannah think William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa8fb998fcc814fd3cd43022d365d55e9794c928 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. 
+24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Avery think Hannah thinks William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..aaabffa3274ae3f39f756c360ae71a54d4d8ed5e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Alexander, Carter, Avery and William entered the bedroom. +2 The persimmon is in the red_basket. +3 Hannah moved the persimmon to the blue_crate. +4 Hannah exited the bedroom. +5 Alexander made no movements and stayed in the bedroom for 1 minute. +6 Alexander exited the bedroom. +7 Carter moved the persimmon to the green_basket. +8 Carter exited the bedroom. +9 Avery made no movements and stayed in the bedroom for 1 minute. +10 Avery exited the bedroom. +11 William moved the persimmon to the red_basket. +12 William exited the bedroom. +13 Hannah, Alexander, Carter, Avery and William entered the waiting_room. +14 William, Alexander and Hannah entered the bathroom. +15 The banana is in the red_bucket. +16 William moved the banana to the red_crate. +17 William exited the bathroom. +18 Alexander made no movements and stayed in the bathroom for 1 minute. +19 Alexander exited the bathroom. +20 Hannah made no movements and stayed in the bathroom for 1 minute. +21 Hannah exited the bathroom. +22 William, Alexander and Hannah entered the waiting_room. +23 Alexander, Avery, William and Hannah entered the garage. +24 The plum is in the red_drawer. +25 Alexander moved the plum to the green_cupboard. +26 Alexander exited the garage. +27 Avery moved the plum to the blue_treasure_chest. +28 Avery exited the garage. +29 William moved the plum to the green_bottle. +30 William exited the garage. +31 Hannah moved the plum to the blue_bathtub. +32 Hannah exited the garage. +33 Alexander, Avery, William and Hannah entered the waiting_room. +Question: Where does Alexander think Avery thinks Hannah thinks William thinks the persimmon is? +Answer: blue_crate +Choices: A. red_crate, B. red_bucket, C. red_box, D. blue_bucket, E. green_box, F. red_basket, G. blue_crate, H. green_bathtub, I. green_envelope, J. green_basket, K. red_drawer, L. green_bottle, M. blue_bathtub, N. blue_treasure_chest, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..989d4c7e4407f92bc01a7fa228142ae1de24a46e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. 
+18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where is the eggplant really? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: J. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe595988cfcd1c539d07d20564056e59341869f8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. 
+34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emma really think the eggplant is? +Answer: green_pantry +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: H. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bec484e32222531d012ea1e67b92eea0b0730bef --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. 
+9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jackson think Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: G. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2ed16db92f6447d71083e824f0d52d56661dfd5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. +4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. 
+29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Jack think Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: H. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef41b6e2df6470c080807a7a41756de9da9f928f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Avery, Emma, Jack and Jackson entered the garage. +2 The eggplant is in the green_pantry. +3 Emily moved the eggplant to the blue_drawer. 
+4 Emily exited the garage. +5 Avery made no movements and stayed in the garage for 1 minute. +6 Avery exited the garage. +7 Emma moved the eggplant to the green_box. +8 Emma exited the garage. +9 Jack made no movements and stayed in the garage for 1 minute. +10 Jack exited the garage. +11 Jackson made no movements and stayed in the garage for 1 minute. +12 Jackson exited the garage. +13 Emily, Avery, Emma, Jack and Jackson entered the waiting_room. +14 Emma, Emily and Jack entered the garage. +15 The eggplant is in the green_box. +16 Emma made no movements and stayed in the garage for 1 minute. +17 Emma exited the garage. +18 Emily moved the eggplant to the green_bottle. +19 Emily exited the garage. +20 Jack moved the eggplant to the green_pantry. +21 Jack exited the garage. +22 Emma, Emily and Jack entered the waiting_room. +23 Emily, Avery, Jack and Emma entered the garage. +24 The cherry is in the blue_drawer. +25 Emily moved the cherry to the green_box. +26 Jack likes the green_envelope. +27 Emily exited the garage. +28 Avery moved the cherry to the green_pantry. +29 Avery exited the garage. +30 Jack moved the cherry to the blue_cupboard. +31 Emily saw a monkey. +32 Jack exited the garage. +33 Emma moved the cherry to the green_bottle. +34 Emma exited the garage. +35 Emily, Avery, Jack and Emma entered the waiting_room. +Question: Where does Emily think Jack thinks Jackson thinks Emma thinks the eggplant is? +Answer: green_box +Choices: A. green_basket, B. blue_container, C. green_envelope, D. blue_suitcase, E. blue_bathtub, F. blue_drawer, G. green_pantry, H. green_box, I. blue_cupboard, J. green_bottle, K. green_drawer, L. red_crate, M. blue_crate, N. red_bottle, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: H. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0bb510f88ba6659b5e97fc07f9fcb7db868cc3d9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. 
+23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where is the lime really? +Answer: blue_crate +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: O. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7543e6cde21569141ec793f5f773262e7bdc39b2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. 
+32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Elizabeth really think the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: N. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..239ea4fe58cdd26793490e9ef3ed4e3f107ae1c9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. 
+5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Alexander think Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: N. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c54d9c4f1a03033a0eccb06003cbd693bb87f5a9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. 
+20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. +32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Owen think Alexander thinks Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: O. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0987043ca835c2a728ace9d9b70d30590f2e3a1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth, Alexander, Nathan, Owen and Jackson entered the cellar. +2 Jackson lost his watch. +3 The lime is in the blue_crate. +4 Elizabeth moved the lime to the green_pantry. +5 Elizabeth exited the cellar. +6 Nathan saw a monkey. +7 Alexander made no movements and stayed in the cellar for 1 minute. +8 Alexander exited the cellar. +9 Nathan moved the lime to the green_basket. +10 Nathan exited the cellar. +11 Owen moved the lime to the red_box. +12 Owen exited the cellar. +13 Jackson moved the lime to the blue_crate. +14 Jackson exited the cellar. +15 Elizabeth, Alexander, Nathan, Owen and Jackson entered the waiting_room. +16 Nathan, Jackson and Elizabeth entered the workshop. +17 The sweet_potato is in the blue_suitcase. +18 Nathan made no movements and stayed in the workshop for 1 minute. +19 Nathan exited the workshop. +20 Jackson made no movements and stayed in the workshop for 1 minute. +21 Jackson exited the workshop. +22 Elizabeth made no movements and stayed in the workshop for 1 minute. +23 Elizabeth exited the workshop. +24 Nathan, Jackson and Elizabeth entered the waiting_room. +25 Elizabeth, Owen, Alexander and Nathan entered the workshop. +26 The plum is in the green_box. +27 Elizabeth made no movements and stayed in the workshop for 1 minute. +28 Elizabeth exited the workshop. +29 Owen moved the plum to the red_basket. +30 Jackson likes the blue_suitcase. +31 Owen exited the workshop. 
+32 Alexander lost his phone. +33 Alexander moved the plum to the red_drawer. +34 Alexander exited the workshop. +35 Nathan moved the plum to the green_cupboard. +36 Nathan exited the workshop. +37 Elizabeth, Owen, Alexander and Nathan entered the waiting_room. +Question: Where does Nathan think Owen thinks Alexander thinks Elizabeth thinks the lime is? +Answer: green_pantry +Choices: A. green_box, B. blue_suitcase, C. red_drawer, D. red_basket, E. green_cupboard, F. red_crate, G. blue_pantry, H. green_crate, I. green_bathtub, J. blue_drawer, K. blue_bucket, L. blue_crate, M. green_basket, N. green_pantry, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: N. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a4d0362c943344760c5d7c8659df7e046827151 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. 
+3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where is the pear really? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: N. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3f37c6f7abc5a91da5f0855608e5aa050ac8ae2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. 
+23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Noah really think the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..777bc11d408d7634a2ef451cd799b72c2ec43919 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. 
+34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does William think Noah thinks the pear is? +Answer: green_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: M. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6f0b8eec274c0b21c02fcf688e3f6348b2ffe3a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. 
+6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. +25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Isabella think William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d32b1d2ae8533dd8dea296f001114689cabef7d8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Jack, William, Noah and Aiden entered the playroom. +2 The pear is in the blue_crate. +3 Isabella made no movements and stayed in the playroom for 1 minute. +4 Isabella exited the playroom. +5 William dislikes the peas. +6 Jack moved the pear to the blue_drawer. +7 Aiden lost his watch. +8 Jack exited the playroom. +9 William moved the pear to the green_crate. +10 William exited the playroom. +11 Noah moved the pear to the blue_suitcase. +12 Noah exited the playroom. +13 Noah saw a mouse. +14 Aiden moved the pear to the blue_crate. +15 Aiden exited the playroom. +16 Isabella, Jack, William, Noah and Aiden entered the waiting_room. +17 Noah, Jack and William entered the dining_room. +18 The peas is in the green_drawer. +19 Noah moved the peas to the blue_pantry. +20 Noah exited the dining_room. +21 Jack moved the peas to the red_pantry. +22 Jack exited the dining_room. +23 William made no movements and stayed in the dining_room for 1 minute. +24 William exited the dining_room. 
+25 Noah, Jack and William entered the waiting_room. +26 Isabella, Noah, Jack and Aiden entered the playroom. +27 The lemon is in the blue_suitcase. +28 Isabella moved the lemon to the green_basket. +29 Isabella exited the playroom. +30 Noah made no movements and stayed in the playroom for 1 minute. +31 Noah exited the playroom. +32 Jack moved the lemon to the blue_crate. +33 Jack exited the playroom. +34 Aiden made no movements and stayed in the playroom for 1 minute. +35 Noah lost his phone. +36 Aiden exited the playroom. +37 Isabella, Noah, Jack and Aiden entered the waiting_room. +Question: Where does Aiden think Isabella thinks William thinks Noah thinks the pear is? +Answer: blue_crate +Choices: A. red_pantry, B. green_drawer, C. blue_pantry, D. blue_bucket, E. green_box, F. green_bathtub, G. red_bottle, H. red_crate, I. red_envelope, J. blue_cupboard, K. blue_suitcase, L. blue_crate, M. green_crate, N. blue_drawer, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c619707c25ce772d4c8bc45502c2697a8dc22143 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. 
+33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where is the onion really? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: O. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6915c9555e400c42c7633f7c2026bd48613d03ae --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. 
+4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Nathan really think the onion is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..48cf99504ba9da4f018c668c25f8bdae6f326ba1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. 
+21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Emily think Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3430e7fc1a2a817e6070576294956fa664ccdedd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. +3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. 
+33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Owen think Emily thinks Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: O. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d24d499e9064e1507cab827945583fcf6b4f2507 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Charlotte, Owen, Nathan and Liam entered the attic. +2 The onion is in the blue_treasure_chest. 
+3 Emily made no movements and stayed in the attic for 1 minute. +4 Emily exited the attic. +5 Charlotte moved the onion to the green_treasure_chest. +6 Charlotte exited the attic. +7 Owen moved the onion to the red_drawer. +8 Owen exited the attic. +9 Nathan made no movements and stayed in the attic for 1 minute. +10 Nathan exited the attic. +11 Liam made no movements and stayed in the attic for 1 minute. +12 Liam exited the attic. +13 Nathan lost his gloves. +14 Emily, Charlotte, Owen, Nathan and Liam entered the waiting_room. +15 Emily, Charlotte and Liam entered the front_yard. +16 The lemon is in the red_bottle. +17 Emily moved the lemon to the blue_container. +18 Charlotte likes the red_bottle. +19 Emily exited the front_yard. +20 Charlotte moved the lemon to the blue_crate. +21 Charlotte exited the front_yard. +22 Liam moved the lemon to the green_drawer. +23 Emily likes the red_envelope. +24 Liam exited the front_yard. +25 Emily, Charlotte and Liam entered the waiting_room. +26 Nathan dislikes the eggplant. +27 Charlotte, Owen, Liam and Nathan entered the attic. +28 The onion is in the red_drawer. +29 Charlotte made no movements and stayed in the attic for 1 minute. +30 Charlotte exited the attic. +31 Owen moved the onion to the blue_bottle. +32 Owen exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Liam saw a dog. +36 Nathan made no movements and stayed in the attic for 1 minute. +37 Nathan exited the attic. +38 Charlotte, Owen, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Owen thinks Emily thinks Nathan thinks the onion is? +Answer: blue_container +Choices: A. green_bathtub, B. red_pantry, C. green_bottle, D. red_envelope, E. green_pantry, F. red_bottle, G. green_drawer, H. blue_container, I. blue_drawer, J. blue_crate, K. blue_treasure_chest, L. blue_bucket, M. green_treasure_chest, N. red_drawer, O. blue_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: O. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2ef071a21475f66d91823806bc57d8cd194c5503 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. 
+18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where is the spinach really? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_treasure_chest +GPT-4 Explain: O. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7adba22522e0c5101f14afd972c2e514cd58ca57 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. 
+30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Evelyn really think the spinach is? +Answer: blue_treasure_chest +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: M. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..130931a6aefd21f6af087a6958aa0ab2f655960c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Jackson think Evelyn thinks the spinach is? +Answer: green_cupboard +Choices: A. green_envelope, B. red_pantry, C. 
blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: M. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..44332d517dd3cd9e823d4c0c04287a1c00559941 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. 
+12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. +24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Liam think Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..01c6a2c662daa00e7fc19f7be0e37ab7e64e9378 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Elizabeth, Evelyn, Liam and Noah entered the living_room. +2 The spinach is in the green_drawer. +3 Jackson made no movements and stayed in the living_room for 1 minute. +4 Jackson exited the living_room. +5 Elizabeth moved the spinach to the green_pantry. +6 Elizabeth exited the living_room. +7 Evelyn moved the spinach to the red_container. +8 Evelyn lost his phone. +9 Evelyn exited the living_room. +10 Liam made no movements and stayed in the living_room for 1 minute. +11 Liam exited the living_room. +12 Noah moved the spinach to the green_drawer. +13 Noah exited the living_room. +14 Elizabeth lost his watch. +15 Jackson, Elizabeth, Evelyn, Liam and Noah entered the waiting_room. +16 Liam, Jackson and Evelyn entered the dining_room. +17 The sweet_potato is in the red_crate. +18 Liam moved the sweet_potato to the blue_bucket. +19 Evelyn saw a cat. +20 Liam exited the dining_room. +21 Jackson moved the sweet_potato to the blue_container. +22 Jackson exited the dining_room. +23 Evelyn made no movements and stayed in the dining_room for 1 minute. 
+24 Evelyn exited the dining_room. +25 Liam, Jackson and Evelyn entered the waiting_room. +26 Liam, Jackson, Elizabeth and Evelyn entered the living_room. +27 The spinach is in the green_drawer. +28 Liam made no movements and stayed in the living_room for 1 minute. +29 Liam exited the living_room. +30 Jackson moved the spinach to the green_cupboard. +31 Jackson likes the blue_bathtub. +32 Jackson exited the living_room. +33 Elizabeth moved the spinach to the blue_treasure_chest. +34 Elizabeth exited the living_room. +35 Evelyn made no movements and stayed in the living_room for 1 minute. +36 Evelyn exited the living_room. +37 Evelyn likes the green_pantry. +38 Liam, Jackson, Elizabeth and Evelyn entered the waiting_room. +Question: Where does Elizabeth think Liam thinks Jackson thinks Evelyn thinks the spinach is? +Answer: green_drawer +Choices: A. green_envelope, B. red_pantry, C. blue_bathtub, D. green_crate, E. blue_drawer, F. red_crate, G. red_bottle, H. green_treasure_chest, I. blue_container, J. blue_bucket, K. blue_treasure_chest, L. green_drawer, M. green_pantry, N. red_container, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: O. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a1ea13d7a65bac4f9b1857cd46a3ad6616e4ac2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. 
+32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where is the peas really? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: J. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6ba97b26f706f9a31c29c24a465f9ce27afda28 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. 
+6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Isla really think the peas is? +Answer: blue_cupboard +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: B. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..07a50482beec18316ed9d97d0dc2e614d861aea9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. 
+20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Amelia think Isla thinks the peas is? +Answer: green_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: J. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..177409241c294f9954d86a59aa4b34a9dafdd9ca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. +5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. 
+32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Carter think Amelia thinks Isla thinks the peas is? +Answer: green_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: J. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a38c1b00fb17d9c411ed18b0519be66142a2b57 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Carter, Isla, Amelia and Emma entered the staircase. +2 The peas is in the green_treasure_chest. +3 Mila moved the peas to the blue_bucket. +4 Mila exited the staircase. 
+5 Carter moved the peas to the green_bucket. +6 Carter exited the staircase. +7 Isla made no movements and stayed in the staircase for 1 minute. +8 Isla exited the staircase. +9 Amelia dislikes the spinach. +10 Amelia moved the peas to the blue_cupboard. +11 Amelia exited the staircase. +12 Emma made no movements and stayed in the staircase for 1 minute. +13 Emma exited the staircase. +14 Mila, Carter, Isla, Amelia and Emma entered the waiting_room. +15 Amelia, Carter and Isla entered the staircase. +16 Mila likes the red_basket. +17 The watermelon is in the blue_bucket. +18 Amelia made no movements and stayed in the staircase for 1 minute. +19 Amelia exited the staircase. +20 Carter moved the watermelon to the green_bucket. +21 Carter exited the staircase. +22 Isla made no movements and stayed in the staircase for 1 minute. +23 Isla exited the staircase. +24 Amelia, Carter and Isla entered the waiting_room. +25 Emma, Amelia, Isla and Carter entered the study. +26 The lemon is in the red_basket. +27 Emma made no movements and stayed in the study for 1 minute. +28 Emma exited the study. +29 Amelia made no movements and stayed in the study for 1 minute. +30 Amelia exited the study. +31 Isla moved the lemon to the green_cupboard. +32 Isla exited the study. +33 Carter made no movements and stayed in the study for 1 minute. +34 Carter exited the study. +35 Emma, Amelia, Isla and Carter entered the waiting_room. +Question: Where does Mila think Carter thinks Amelia thinks Isla thinks the peas is? +Answer: blue_bucket +Choices: A. green_treasure_chest, B. blue_bucket, C. green_bucket, D. red_envelope, E. blue_cupboard, F. red_basket, G. green_crate, H. green_pantry, I. green_bathtub, J. green_cupboard, K. red_drawer, L. green_envelope, M. blue_treasure_chest, N. red_bucket, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: J. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c371b5e8300e507c62de1512b33e15f2846f1460 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. 
+19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where is the green_pepper really? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bd57ed2fd8726515f751ce507b067d30308e020 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. 
+29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Emma really think the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f16a109dcbf3cd7b97792e7919d98da0bdece12e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Benjamin think Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. 
blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: G. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..10ddb560343153722bd064dd6f15f8636b6e57fc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. 
+12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. +23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Jackson think Benjamin thinks Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a977fb30144f7e44bee97f5dd0da85e7fe34dc7f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jackson, Emma, Abigail, Logan and Benjamin entered the living_room. +2 The green_pepper is in the red_basket. +3 Jackson moved the green_pepper to the blue_container. +4 Jackson exited the living_room. +5 Benjamin saw a cat. +6 Emma made no movements and stayed in the living_room for 1 minute. +7 Emma exited the living_room. +8 Abigail made no movements and stayed in the living_room for 1 minute. +9 Abigail exited the living_room. +10 Logan made no movements and stayed in the living_room for 1 minute. +11 Abigail dislikes the grapes. +12 Logan exited the living_room. +13 Benjamin made no movements and stayed in the living_room for 1 minute. +14 Benjamin exited the living_room. +15 Jackson, Emma, Abigail, Logan and Benjamin entered the waiting_room. +16 Emma likes the blue_bottle. +17 Benjamin, Emma and Abigail entered the bedroom. +18 The grapes is in the red_bottle. +19 Benjamin moved the grapes to the green_bathtub. +20 Benjamin exited the bedroom. +21 Emma made no movements and stayed in the bedroom for 1 minute. +22 Logan dislikes the green_pepper. 
+23 Emma exited the bedroom. +24 Abigail made no movements and stayed in the bedroom for 1 minute. +25 Abigail exited the bedroom. +26 Benjamin, Emma and Abigail entered the waiting_room. +27 Abigail, Emma, Jackson and Logan entered the dining_room. +28 The watermelon is in the blue_drawer. +29 Abigail made no movements and stayed in the dining_room for 1 minute. +30 Abigail exited the dining_room. +31 Emma made no movements and stayed in the dining_room for 1 minute. +32 Emma exited the dining_room. +33 Jackson moved the watermelon to the green_cupboard. +34 Jackson exited the dining_room. +35 Logan moved the watermelon to the red_container. +36 Logan exited the dining_room. +37 Abigail, Emma, Jackson and Logan entered the waiting_room. +Question: Where does Abigail think Jackson thinks Benjamin thinks Emma thinks the green_pepper is? +Answer: blue_container +Choices: A. blue_bottle, B. blue_drawer, C. green_cupboard, D. red_container, E. blue_treasure_chest, F. red_basket, G. blue_container, H. red_box, I. blue_cupboard, J. red_crate, K. red_bottle, L. green_basket, M. green_bottle, N. green_bucket, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: C. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c31117aa6fab869137cce3c95d79c6317f4cf6d5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. 
+32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where is the peas really? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: L. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..34a5cbb0e87d49393c3b1c0e2c584fe6529dfdbf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. 
+5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Hannah really think the peas is? +Answer: blue_bathtub +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..be06d214a17c11fa5785eda7a2cf0e088729588d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. 
+20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Amelia think Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: L. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a6bc7c7c14caa00599cbe0da6bcf7f36b13419e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. +3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. 
+32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Jackson think Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: N. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1fade1cac746e04175d6834b364761061afeb19c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Amelia, Jackson, Hannah and Abigail entered the patio. +2 The peas is in the green_basket. 
+3 Mila made no movements and stayed in the patio for 1 minute. +4 Mila exited the patio. +5 Amelia made no movements and stayed in the patio for 1 minute. +6 Amelia exited the patio. +7 Jackson made no movements and stayed in the patio for 1 minute. +8 Jackson exited the patio. +9 Jackson likes the green_bathtub. +10 Hannah moved the peas to the blue_bathtub. +11 Hannah exited the patio. +12 Abigail made no movements and stayed in the patio for 1 minute. +13 Abigail exited the patio. +14 Mila, Amelia, Jackson, Hannah and Abigail entered the waiting_room. +15 Hannah, Amelia and Mila entered the lounge. +16 The lemon is in the blue_cupboard. +17 Hannah moved the lemon to the red_envelope. +18 Hannah exited the lounge. +19 Amelia moved the lemon to the blue_container. +20 Amelia exited the lounge. +21 Jackson dislikes the beans. +22 Mila moved the lemon to the green_box. +23 Hannah likes the green_crate. +24 Mila exited the lounge. +25 Hannah, Amelia and Mila entered the waiting_room. +26 Hannah, Abigail, Mila and Jackson entered the closet. +27 The sweet_potato is in the red_bucket. +28 Hannah moved the sweet_potato to the green_cupboard. +29 Hannah exited the closet. +30 Abigail made no movements and stayed in the closet for 1 minute. +31 Abigail exited the closet. +32 Mila made no movements and stayed in the closet for 1 minute. +33 Mila exited the closet. +34 Jackson made no movements and stayed in the closet for 1 minute. +35 Jackson exited the closet. +36 Hannah, Abigail, Mila and Jackson entered the waiting_room. +Question: Where does Abigail think Jackson thinks Amelia thinks Hannah thinks the peas is? +Answer: green_basket +Choices: A. blue_pantry, B. red_bucket, C. green_cupboard, D. green_crate, E. red_basket, F. green_box, G. blue_cupboard, H. red_envelope, I. blue_container, J. red_drawer, K. green_bucket, L. green_basket, M. red_pantry, N. green_bathtub, O. blue_bathtub + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: L. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cd666acefdedbb54146d4bb87d72c7c5922ab0e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. 
+19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where is the turnip really? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: C. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c1d0782f1607db4f3a4a3543dd90e60007bf3d52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. 
+32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Hannah really think the turnip is? +Answer: blue_pantry +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ae36d845d537fc9cb036de3d5d2d33e9c0319a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. 
+5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Lily think Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8230fbfc0d7cd5b63a39ebe68354f18ccb2ffe12 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. 
+21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. +32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Noah think Lily thinks Hannah thinks the turnip is? +Answer: red_basket +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: C. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..31005a65a76d75420c1ffefd22a9bc1543e23478 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1,45 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Lily, Logan, Elizabeth and Noah entered the study. +2 The turnip is in the red_basket. +3 Hannah made no movements and stayed in the study for 1 minute. +4 Hannah exited the study. +5 Lily made no movements and stayed in the study for 1 minute. +6 Lily exited the study. +7 Logan made no movements and stayed in the study for 1 minute. +8 Lily dislikes the onion. +9 Logan exited the study. +10 Elizabeth moved the turnip to the green_pantry. +11 Elizabeth exited the study. +12 Noah moved the turnip to the red_basket. +13 Noah exited the study. +14 Logan lost his watch. +15 Hannah, Lily, Logan, Elizabeth and Noah entered the waiting_room. +16 Noah, Logan and Hannah entered the dining_room. +17 The sweet_potato is in the blue_suitcase. +18 Noah moved the sweet_potato to the red_envelope. +19 Noah exited the dining_room. +20 Logan moved the sweet_potato to the green_drawer. +21 Logan exited the dining_room. +22 Hannah made no movements and stayed in the dining_room for 1 minute. +23 Hannah exited the dining_room. +24 Noah, Logan and Hannah entered the waiting_room. +25 Noah, Lily, Hannah and Elizabeth entered the study. +26 The turnip is in the red_basket. +27 Noah dislikes the cabbage. +28 Noah made no movements and stayed in the study for 1 minute. +29 Noah exited the study. +30 Lily made no movements and stayed in the study for 1 minute. +31 Lily exited the study. 
+32 Hannah moved the turnip to the blue_pantry. +33 Hannah exited the study. +34 Elizabeth made no movements and stayed in the study for 1 minute. +35 Elizabeth exited the study. +36 Noah, Lily, Hannah and Elizabeth entered the waiting_room. +Question: Where does Logan think Noah thinks Lily thinks Hannah thinks the turnip is? +Answer: green_drawer +Choices: A. red_basket, B. green_crate, C. blue_pantry, D. green_pantry, E. red_bucket, F. green_box, G. green_basket, H. blue_drawer, I. blue_bucket, J. red_drawer, K. blue_suitcase, L. red_envelope, M. green_drawer, N. red_crate, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: K. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc9c8fdb58b7d328463f876517fef18b47a63223 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. 
+4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where is the watermelon really? +Answer: red_bottle +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: K. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..94e2c897281eeac913fce049bc0ec71cf198f404 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. 
+18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Evelyn really think the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: L. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5323243bf5a753d245cb039c86bc064b6d8982dd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. 
+29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Logan think Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: K. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ab8d75f700ba471b73c2505bb189dcdb4d2af8b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. 
+2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. +16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Chloe think Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. 
green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: K \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b8df7612964ff56689a757e46e29d3c908647ce --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Evelyn, Chloe, Charlotte, Logan and Mila entered the staircase. +2 Chloe lost his gloves. +3 The watermelon is in the green_cupboard. +4 Evelyn made no movements and stayed in the staircase for 1 minute. +5 Chloe lost his watch. +6 Evelyn exited the staircase. +7 Chloe made no movements and stayed in the staircase for 1 minute. +8 Chloe exited the staircase. +9 Charlotte made no movements and stayed in the staircase for 1 minute. +10 Charlotte exited the staircase. +11 Logan made no movements and stayed in the staircase for 1 minute. +12 Logan exited the staircase. +13 Mila moved the watermelon to the green_cupboard. +14 Mila exited the staircase. +15 Evelyn, Chloe, Charlotte, Logan and Mila entered the waiting_room. 
+16 Charlotte, Logan and Chloe entered the staircase. +17 The lemon is in the red_pantry. +18 Charlotte made no movements and stayed in the staircase for 1 minute. +19 Charlotte exited the staircase. +20 Logan made no movements and stayed in the staircase for 1 minute. +21 Logan exited the staircase. +22 Chloe moved the lemon to the green_cupboard. +23 Chloe exited the staircase. +24 Charlotte, Logan and Chloe entered the waiting_room. +25 Evelyn, Mila, Logan and Chloe entered the staircase. +26 The watermelon is in the green_cupboard. +27 Evelyn made no movements and stayed in the staircase for 1 minute. +28 Evelyn exited the staircase. +29 Mila made no movements and stayed in the staircase for 1 minute. +30 Mila exited the staircase. +31 Logan moved the watermelon to the red_bottle. +32 Logan exited the staircase. +33 Chloe made no movements and stayed in the staircase for 1 minute. +34 Chloe exited the staircase. +35 Evelyn, Mila, Logan and Chloe entered the waiting_room. +Question: Where does Charlotte think Chloe thinks Logan thinks Evelyn thinks the watermelon is? +Answer: green_cupboard +Choices: A. green_box, B. blue_drawer, C. red_container, D. red_basket, E. blue_treasure_chest, F. green_drawer, G. blue_crate, H. green_pantry, I. blue_pantry, J. blue_bucket, K. red_pantry, L. green_cupboard, M. red_bottle, N. green_envelope, O. green_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_cupboard +GPT-4 Explain: K. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f55a9fa2af01756d91e3dd4e897b05b0b3b88423 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. 
+34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where is the lemon really? +Answer: green_drawer +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: N. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..474aa79337ab8ef500b0c7f01d95934458201056 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. 
+7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Aiden really think the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..56b7082a47816747a82c19afaefb582cef95cddb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. 
+25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Nathan think Aiden thinks the lemon is? +Answer: green_basket +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: O. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e69a63c71e4a1de2b802989b4c2b124b4d6cdb48 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. +6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. 
+35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Jack think Nathan thinks Aiden thinks the lemon is? +Answer: blue_pantry +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: N. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..479282b608b2cb527bc2e087659c18c3f8aa764e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Jack, Liam, Aiden, Sophia and Nathan entered the garage. +2 The lemon is in the green_drawer. +3 Jack moved the lemon to the blue_pantry. +4 Jack exited the garage. +5 Liam moved the lemon to the blue_crate. 
+6 Liam exited the garage. +7 Aiden moved the lemon to the green_basket. +8 Aiden exited the garage. +9 Sophia made no movements and stayed in the garage for 1 minute. +10 Sophia exited the garage. +11 Nathan moved the lemon to the green_drawer. +12 Nathan exited the garage. +13 Jack likes the green_drawer. +14 Jack, Liam, Aiden, Sophia and Nathan entered the waiting_room. +15 Jack, Liam and Nathan entered the garage. +16 The eggplant is in the green_envelope. +17 Jack made no movements and stayed in the garage for 1 minute. +18 Jack exited the garage. +19 Liam made no movements and stayed in the garage for 1 minute. +20 Liam exited the garage. +21 Nathan saw a cat. +22 Nathan moved the eggplant to the blue_crate. +23 Nathan exited the garage. +24 Jack, Liam and Nathan entered the waiting_room. +25 Sophia, Aiden, Liam and Nathan entered the cellar. +26 The cherry is in the red_envelope. +27 Sophia moved the cherry to the green_bottle. +28 Sophia exited the cellar. +29 Liam lost his watch. +30 Aiden moved the cherry to the green_crate. +31 Aiden exited the cellar. +32 Liam made no movements and stayed in the cellar for 1 minute. +33 Jack dislikes the persimmon. +34 Liam exited the cellar. +35 Aiden dislikes the lemon. +36 Nathan made no movements and stayed in the cellar for 1 minute. +37 Nathan exited the cellar. +38 Sophia, Aiden, Liam and Nathan entered the waiting_room. +Question: Where does Liam think Jack thinks Nathan thinks Aiden thinks the lemon is? +Answer: blue_pantry +Choices: A. red_envelope, B. blue_bottle, C. green_bottle, D. green_pantry, E. green_crate, F. red_basket, G. green_cupboard, H. blue_treasure_chest, I. red_box, J. green_bucket, K. green_envelope, L. green_drawer, M. blue_crate, N. blue_pantry, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: N. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b00dccbae2ee5c7d0288187fa009d42d9014a3f8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. 
+19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where is the cabbage really? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: F. 
blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ffe5e5e6b7f171970bc13aeac712323d7629544 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. 
+30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Isla really think the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b6082bc13f94635c9f619448f55004529b61b6d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Elizabeth think Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. 
blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: I. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c2f54ad2a44fdd7da2ab4e5ba2636a55428746f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. 
+13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. +25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Abigail think Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: I. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..067a8359fc7768c8eeb4d5c0f0f2410026f01096 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/No_Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isla, Elizabeth, William, Aiden and Abigail entered the playroom. +2 The cabbage is in the blue_bathtub. +3 Abigail likes the green_drawer. +4 Isla made no movements and stayed in the playroom for 1 minute. +5 Isla exited the playroom. +6 Elizabeth made no movements and stayed in the playroom for 1 minute. +7 Elizabeth exited the playroom. +8 William moved the cabbage to the blue_treasure_chest. +9 William exited the playroom. +10 Aiden moved the cabbage to the blue_bottle. +11 Elizabeth likes the green_treasure_chest. +12 Aiden exited the playroom. +13 Abigail made no movements and stayed in the playroom for 1 minute. +14 Abigail exited the playroom. +15 Isla likes the green_bottle. +16 Isla, Elizabeth, William, Aiden and Abigail entered the waiting_room. +17 William, Elizabeth and Isla entered the closet. +18 The lime is in the red_envelope. +19 William moved the lime to the green_bathtub. +20 William exited the closet. +21 Elizabeth made no movements and stayed in the closet for 1 minute. +22 Elizabeth exited the closet. +23 Isla made no movements and stayed in the closet for 1 minute. +24 Isla exited the closet. 
+25 William, Elizabeth and Isla entered the waiting_room. +26 William, Isla, Aiden and Abigail entered the playroom. +27 Aiden likes the blue_treasure_chest. +28 The cabbage is in the blue_bottle. +29 William made no movements and stayed in the playroom for 1 minute. +30 William exited the playroom. +31 Isla moved the cabbage to the blue_bathtub. +32 Isla exited the playroom. +33 Aiden made no movements and stayed in the playroom for 1 minute. +34 Aiden exited the playroom. +35 Abigail made no movements and stayed in the playroom for 1 minute. +36 Abigail exited the playroom. +37 William, Isla, Aiden and Abigail entered the waiting_room. +Question: Where does Aiden think Abigail thinks Elizabeth thinks Isla thinks the cabbage is? +Answer: blue_bathtub +Choices: A. red_container, B. red_envelope, C. green_bathtub, D. green_box, E. red_crate, F. blue_bathtub, G. blue_drawer, H. blue_treasure_chest, I. green_treasure_chest, J. blue_bottle, K. green_bottle, L. green_bucket, M. green_pantry, N. blue_cupboard, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: H. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c0aa71d0c3209174b82212407d2a25047497b37f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where is the carrot really? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their interactions. + +1. William, Jack, Charlotte, Noah, and Hannah entered the hall. +2. Noah saw a monkey. +3. The carrot is in the red_basket. +4. William made no movements and stayed in the hall for 1 minute. +5. William exited the hall. +6. Hannah saw a mouse. +7. Jack made no movements and stayed in the hall for 1 minute. +8. Jack exited the hall. +9. Charlotte made no movements and stayed in the hall for 1 minute. +10. Charlotte exited the hall. +11. Charlotte dislikes the tomato. +12. Noah moved the carrot to the green_envelope. +13. Noah exited the hall. +14. Hannah moved the carrot to the red_basket. +15. Hannah exited the hall. +16. William, Jack, Charlotte, Noah, and Hannah entered the waiting_room. +17. Charlotte publicly claimed that carrot is in the green_envelope. +18. Hannah privately told Charlotte that the carrot is in the blue_container. + +Based on the story and assumptions, we know that Charlotte tends to lie and that Hannah privately told Charlotte that the carrot is in the blue_container. Therefore, we can eliminate the options that Charlotte claimed (green_envelope) and the opposite of what Hannah told her (red_basket). + +We also know that Noah moved the carrot to the green_envelope before exiting the hall, and Hannah moved it to the red_basket after Noah left. 
Therefore, we can eliminate the options that were not mentioned in the story (blue_container, red_crate, green_drawer, blue_bucket, green_cupboard, red_bottle, green_treasure_chest, blue_cupboard, red_pantry, red_container, blue_bathtub, red_envelope, blue_pantry). + +This leaves us with the option A. green_envelope as the most likely answer. + +a: 7 6 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5166295de2ae8464450590bcf5993c58824f9edf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does William really think the carrot is? +Answer: green_envelope +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. 
blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to look for any information related to William's thoughts on the location of the carrot. According to the story, William made no movements and stayed in the hall for 1 minute before exiting. There is no other information provided about William's actions or interactions with other agents that could give us a clue about his thoughts on the location of the carrot. Therefore, we cannot determine where William really thinks the carrot is based on the given information. The answer is not provided in the options given. The correct answer is "Cannot be determined." + +a: 5 6 7 9 4 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..10e3a86c9a15615d7a4eab5847030540d1382960 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. 
+3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Hannah think William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Hannah and William. According to the story, William made no movements in the hall and exited after Hannah. Hannah moved the carrot to the red_basket before exiting the hall. 
In the waiting room, Charlotte publicly claimed that the carrot is in the green_envelope, and Hannah privately told Charlotte that the carrot is in the blue_container. + +Since Hannah and William were never in the same place, we cannot directly infer what Hannah thinks William thinks about the carrot's location. However, we can make some assumptions based on the given information. Since Hannah moved the carrot to the red_basket before exiting the hall, it is possible that she thinks the carrot is still in the red_basket. William made no movements in the hall, so he may not have seen the carrot or know where it is. However, since William exited the hall after Hannah, she may trust his opinion more than the others who exited before her. + +Therefore, the most likely answer is that Hannah thinks William thinks the carrot is in the red_basket. The correct answer is B. red_basket. + +a: 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3921a36767033b6b21de7c0498f20a412af8f494 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. 
+14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Jack think Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. We need to determine where Hannah thinks the carrot is. +- According to step 14, Hannah moved the carrot to the red_basket before exiting the hall. +- However, according to step 18, Hannah privately told Charlotte that the carrot is in the blue_container. +- Since we know that agents tend to lie, we cannot trust either of these statements completely. However, we can infer that Hannah thinks the carrot is either in the red_basket or the blue_container. + +2. We need to determine where William thinks the carrot is. +- There is no direct information about where William thinks the carrot is. 
+- However, since William made no movements and stayed in the hall for 1 minute before exiting, we can assume that he did not move the carrot or see anyone else move it. Therefore, he may not have any idea where the carrot is. + +3. We need to determine where Jack thinks Hannah thinks William thinks the carrot is. +- Since we don't know where William thinks the carrot is, we can ignore that part of the question. +- We know that Jack made no movements and stayed in the hall for 1 minute before exiting. Therefore, he may have seen Hannah move the carrot to the red_basket. +- However, since we also know that agents tend to lie, we cannot trust this completely. +- We also know that Hannah privately told Charlotte that the carrot is in the blue_container. Since Jack did not have a private interaction with Hannah, he would not know this information. +- Therefore, the only information we have to go on is that Jack may have seen Hannah move the carrot to the red_basket. +- However, since we are looking for where Jack thinks Hannah thinks William thinks the carrot is, we need to consider what Jack might think Hannah thinks about William's thoughts. +- Since we don't know where William thinks the carrot is, we cannot determine what Hannah might think about his thoughts. +- Therefore, the best answer we can give is that Jack may think Hannah thinks the carrot is in the red_basket. + +Answer: B. red_basket + +a: 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c1d8b2d12414dd559d1e9f7ddcfbb872bab8f96c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Charlotte think Jack thinks Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. 
Charlotte publicly claimed that the carrot is in the green_envelope. +2. Hannah privately told Charlotte that the carrot is in the blue_container. +3. Charlotte thinks that Hannah is lying. +4. Therefore, Charlotte thinks that the carrot is not in the blue_container. +5. William made no movements and stayed in the hall for 1 minute. +6. William exited the hall. +7. Jack made no movements and stayed in the hall for 1 minute. +8. Jack exited the hall. +9. Charlotte made no movements and stayed in the hall for 1 minute. +10. Charlotte exited the hall. +11. Therefore, Charlotte trusts Jack more than Hannah or William. +12. Hannah saw a mouse. +13. Therefore, Hannah did not see the monkey that Noah saw. +14. Noah moved the carrot to the green_envelope. +15. Therefore, the carrot is in the green_envelope. +16. Charlotte dislikes the tomato. +17. Therefore, we can eliminate any answer choices that mention a tomato. +18. We know that Charlotte trusts Jack more than Hannah or William, so we can eliminate any answer choices that mention a container that Hannah or William saw. +19. Therefore, the answer is A. green_envelope. + +So, to summarize: Charlotte publicly claimed that the carrot is in the green_envelope. Hannah privately told Charlotte that the carrot is in the blue_container, but Charlotte thinks Hannah is lying. William, Jack, Charlotte, Noah, and Hannah all entered the hall, but only Noah saw the monkey. William, Jack, and Charlotte all stayed in the hall for 1 minute before exiting in that order. Charlotte trusts Jack more than Hannah or William. Noah moved the carrot to the green_envelope. Charlotte dislikes the tomato. Therefore, Charlotte thinks that Jack thinks that the carrot is in the green_envelope. 
+ +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5e0f8f026f76df4119c17a739e76d50135d5e421 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where is the potato really? +Answer: green_cupboard +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: To solve this question, we need to track the movements of the potato and the agents. According to the story, the potato was initially in the blue_bathtub, then moved to the blue_pantry by Avery, and then to the green_cupboard by Jacob. + +Later, Jacob publicly claimed that the potato is in the blue_bathtub, but Alexander privately told Jacob that the potato is in the blue_bottle. We need to consider that every agent tends to lie, so we cannot trust Jacob's public claim. + +However, we can infer that Alexander knows the location of the potato since he privately told Jacob that it is in the blue_bottle. We also know that Alexander stayed in the study for one minute, which means he had the opportunity to move the potato. + +Therefore, the correct answer is C. blue_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4877c263dd4b726a843769e89de138e220404d9c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. 
+8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Carter really think the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To solve this question, we need to track Carter's movements and any interactions he had with other agents. According to the story, Carter entered the study with four other agents, made no movements, and stayed in the study for one minute before exiting. We don't have any information about Carter's interactions with other agents, so we can't use assumption (2) to infer his thoughts. + +However, we do know that every agent tends to lie, so we can't trust any public claims made by other agents. 
We also know that agents tend to trust those who exited the room later than themselves, so we can assume that Carter may trust Alexander's private claim since Alexander exited the study after Carter. + +According to Alexander's private claim, the potato is in the blue_bottle, which is not one of the options given in the question. However, we can use this information to eliminate some of the options. The potato was moved from the blue_bathtub to the blue_pantry and then to the green_cupboard, so we can eliminate options A, E, and N. The potato was not moved to any of the red locations, so we can eliminate options F, G, H, I, and O. The potato was not moved to the green_treasure_chest, green_bucket, blue_drawer, green_basket, or red_drawer, so we can eliminate options D, J, L, M, and P. + +This leaves us with only one option: B. green_cupboard. Since we don't have any other information about Carter's thoughts or movements, we can assume that he thinks the potato is in the last place it was moved to before he left the study, which is the green_cupboard. Therefore, the answer is B. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..56925275f38d513243cfb6a5c51a4cac781fb1c9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. 
+8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jacob think Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to track where the potato was moved by each agent and who made public and private claims about its location. + +- Carter entered the study and made no movements, then exited. +- Avery moved the potato from the blue_bathtub to the blue_pantry, then exited. +- Jacob moved the potato from the blue_pantry to the green_cupboard, then exited. +- Jackson entered the study and made no movements, then exited. +- Alexander entered the study and made no movements, then exited. 
+- Jacob publicly claimed that the potato is in the blue_bathtub. +- Alexander privately told Jacob that the potato is in the blue_bottle. + +Based on this information, we know that the potato is not in the blue_bathtub, as Jacob lied about its location. We also know that Alexander knows the true location of the potato, but we don't know if Jacob trusts him or not. + +To determine where Jacob thinks Carter thinks the potato is, we need to consider their movements and interactions. Since Carter made no movements in the study, he did not move the potato. Therefore, Jacob cannot think that Carter thinks the potato is in the green_cupboard, as that was Jacob's own action. + +The only other option is that Jacob thinks Carter thinks the potato is still in the blue_bathtub, since that was the original location of the potato before Avery moved it. Jacob may assume that Carter did not see the potato being moved by Avery and therefore still believes it to be in the blue_bathtub. + +Therefore, the answer is A. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b73054f3f16e8770c998be3ddb35f8f7e1487fc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. 
+10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Alexander think Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: This question requires a bit of deduction and inference based on the given assumptions. We know that Alexander privately told Jacob that the potato is in the blue_bottle. However, Jacob publicly claimed that the potato is in the blue_bathtub. This means that Jacob is lying about the location of the potato. + +Now, we need to figure out where Alexander thinks Jacob thinks Carter thinks the potato is. Since Jacob is lying about the location of the potato, we cannot assume that he actually thinks the potato is in the blue_bathtub. However, we do know that Jacob moved the potato to the green_cupboard before leaving the study. 
+ +Since Alexander privately told Jacob that the potato is in the blue_bottle, we can assume that Alexander thinks Jacob actually believes the potato is in the blue_bottle. Therefore, Alexander would think that Jacob thinks Carter thinks the potato is in the green_cupboard (since that is where Jacob moved the potato to). + +The answer is D. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..37b452739b5021b5b8fd5f250646741a61a2141d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1,57 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jackson think Alexander thinks Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. 
green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. Let's break it down step by step: + +1. Where does Jackson think Alexander thinks Jacob thinks the potato is? +We need to start from the innermost layer of the question and work our way out. So, let's start with "Carter thinks the potato is in the..." and work our way outwards. + +2. Jacob publicly claimed that potato is in the blue_bathtub. +This means that Jacob wants everyone to believe that the potato is in the blue_bathtub. However, we don't know if this is true or false. + +3. Alexander privately told Jacob that the potato is in the blue_bottle. +This means that Alexander knows where the potato actually is, but he only told Jacob in private. We don't know if Jacob believes Alexander or not. + +4. Where does Alexander think Jacob thinks the potato is? +Since Alexander privately told Jacob where the potato is, we can assume that Alexander thinks Jacob knows where the potato is. However, we don't know if Alexander thinks Jacob is telling the truth or not. + +5. Where does Jackson think Alexander thinks Jacob thinks the potato is? +This is where it gets tricky. We don't have any direct information about what Jackson thinks, but we can make some assumptions based on the given information. 
We know that Jackson made no movements and stayed in the study for 1 minute, and he exited the study after Alexander. We also know that agents tend to trust agents who exited the room later than themselves. + +Based on this information, we can assume that Jackson trusts Alexander more than Jacob. Therefore, he might believe that Alexander is telling the truth about the potato being in the blue_bottle, and that Jacob is lying about it being in the blue_bathtub. However, we still don't know where Jackson thinks the potato actually is. + +6. Where does Carter think the potato is? +We don't have any direct information about where Carter thinks the potato is, but we do know that he made no movements and stayed in the study for 1 minute. Therefore, he might have seen where the potato was originally placed (in the blue_bathtub) before Avery moved it to the blue_pantry. + +7. Where does Avery think the potato is? +We know that Avery moved the potato from the blue_bathtub to the blue_pantry, so we can assume that he thinks the potato is in the blue_pantry. + +8. Where does Jacob think the potato is? +Jacob publicly claimed that the potato is in the blue_bathtub, but we don't know if he actually believes this or not. We do know that Alexander privately told him that the potato is in the blue_bottle, so he might be unsure about where the potato actually is. + +9. Where does Alexander think the potato is? +We know that Alexander privately told Jacob that the potato is in the blue_bottle, so we can assume that he thinks the potato is in the blue_bottle. + +Based on all of this information, we can eliminate all of the answer choices except for C (blue_bottle) and A (blue_bathtub). Jackson might believe that Alexander is telling the truth about the potato being in the blue_bottle, but he might also believe that Carter saw the potato in the blue_bathtub before it was moved. Therefore, we can't be sure where Jackson thinks the potato is. 
However, we do know that Alexander thinks the potato is in the blue_bottle, so that is the answer to the question. + +Therefore, the answer is C. blue_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a151ad35f7465292bed352204f534536ccad8bd8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where is the pear really? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To solve this question, we need to track the movements of the pear and the agents' interactions. + +1. The pear is initially in the blue_crate. +2. Ava moves the pear to the green_envelope. +3. Avery moves the pear to the red_pantry. +4. Isabella makes no movements and exits the lounge. +5. Mila makes no movements and exits the lounge. +6. Sophia makes no movements and exits the lounge. +7. Mila dislikes the pear. +8. All agents enter the waiting_room. +9. Isabella publicly claims that the pear is in the green_envelope. +10. Sophia privately tells Isabella that the pear is in the blue_crate. + +Based on this information, we can conclude that Isabella's claim is a lie because the pear was moved from the green_envelope to the red_pantry by Avery. Sophia's private claim contradicts Isabella's public claim, but we cannot trust Sophia's claim because she has no movements or interactions with the pear. Mila dislikes the pear, so we can assume she did not move it. + +Therefore, the pear is in the red_pantry, which is option C. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9fa2ca10b2462cdccc9ffd2babf0d73ad2998f4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Sophia really think the pear is? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to consider the actions and interactions of the agents in the story. Sophia privately told Isabella that the pear is in the blue_crate. However, we also know that the agents tend to lie, so we cannot trust Sophia's statement. We need to look for other clues. + +Ava moved the pear to the green_envelope before exiting the lounge, and Isabella publicly claimed that the pear is in the green_envelope after they entered the waiting_room. This suggests that the pear is indeed in the green_envelope, and Isabella may have seen Ava move it there. + +Therefore, Sophia's real thought about the location of the pear is likely to be in the green_envelope. The answer is I. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a847b0c92a378ea4c6c2df919c984cc6b5c2f18d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. 
+9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Ava think Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of Ava and Sophia and their interactions with other agents. Ava moved the pear from the blue_crate to the green_envelope and then exited the lounge. Sophia made no movements and stayed in the lounge for 1 minute before exiting. Later, in the waiting_room, Isabella publicly claimed that the pear is in the green_envelope, while Sophia privately told Isabella that the pear is in the blue_crate. + +Since Ava exited the lounge before Sophia, she would tend to trust Sophia's claim more than Isabella's claim. 
Therefore, Ava would think that Sophia thinks the pear is in the blue_crate, which is Sophia's private claim. The answer is F. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7022f8c4a15558ddcb37e6f6171204defead3be5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery think Ava thinks Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Avery think the pear is? According to the story, Avery moved the pear to the red_pantry before exiting the lounge. So, Avery thinks the pear is in the red_pantry. + +2. Where does Ava think the pear is? Ava moved the pear from the blue_crate to the green_envelope before exiting the lounge. So, Ava thinks the pear is in the green_envelope. + +3. Where does Sophia think the pear is? Sophia privately told Isabella that the pear is in the blue_crate. So, Sophia thinks the pear is in the blue_crate. + +4. Where does Isabella publicly claim the pear is? Isabella publicly claimed that the pear is in the green_envelope. + +5. Where does Mila think the pear is? The story tells us that Mila dislikes the pear, but it doesn't give us any information about where she thinks it is. + +Now, we need to determine where Avery thinks Ava thinks Sophia thinks the pear is. To do this, we need to consider the assumptions given in the story: + +- Avery can infer another agent's thought only if they have been in the same place or have had private or public interactions. +- Agents tend to trust agents that exited the room later than themselves. + +Based on these assumptions, we can conclude that Avery would trust Sophia's claim about the pear's location because she exited the lounge after him. 
However, he may not trust Isabella's claim because she exited before him. As for Ava, Avery would only be able to infer her thoughts if they had a private or public interaction. The story doesn't give us any information about this, so we can't determine where Avery thinks Ava thinks the pear is. + +Therefore, the answer to the question is: cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..de908025fe4f6d29d19fff71a9b3cf573c72cf52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. 
red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? + +2. Mila dislikes the pear, so we can assume that she would not think the pear is in the green_envelope (where Ava moved it). + +3. Avery moved the pear to the red_pantry, so we can assume that he thinks the pear is in the red_pantry. + +4. Sophia privately told Isabella that the pear is in the blue_crate, so we can assume that Sophia thinks the pear is in the blue_crate. + +5. Isabella publicly claimed that the pear is in the green_envelope, but we know that Ava moved the pear to the green_envelope, so we can assume that Ava also thinks the pear is in the green_envelope. + +6. Mila did not make any movements or claims about the pear, so we don't have any direct information about where she thinks the pear is. + +7. However, we know that Mila exited the lounge after Sophia, and Mila tends to trust agents who exit later than herself. Therefore, Mila may trust Sophia's claim that the pear is in the blue_crate. + +8. Finally, we need to determine where Avery thinks Ava thinks Sophia thinks the pear is. We know that Avery moved the pear to the red_pantry, so he may think that the pear is in the red_pantry. 
However, we don't have any direct information about what Avery thinks about Sophia's claim or what he thinks Ava thinks. + +Based on the information we have, the best answer is probably H. red_pantry, since that is where Avery moved the pear and he may think that is where it is. However, there is some uncertainty about what Avery thinks about Sophia's claim and what he thinks Ava thinks, so it's possible that another answer could be correct. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..16d6f0cf4a8b4b09530ab83112e38b227b9f7e58 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. 
red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their interactions. + +- Owen entered the front yard, made no movements, and exited. +- Logan entered the front yard, moved the tangerine to the green box, and exited. +- Elizabeth entered the front yard, moved the tangerine to the red basket, and exited. +- Alexander entered the front yard, made no movements, and exited. +- Ava entered the front yard, made no movements, and exited. +- Elizabeth publicly claimed that the tangerine is in the blue crate. +- Ava privately told Elizabeth that the tangerine is in the red basket. + +Based on the above information, we can eliminate some options. The tangerine is not in the blue crate because Elizabeth lied about it. The tangerine is not in the green crate or the green box because Logan and Elizabeth moved it from there. The tangerine is not in the red drawer, red bucket, blue drawer, green drawer, green bucket, red pantry, green envelope, blue pantry, blue treasure chest, or red container because there is no mention of it being there. + +Therefore, the tangerine is either in the red bottle, red basket, or red pantry. 
Elizabeth moved the tangerine to the red basket, but Ava privately told her that it is in the red basket. We know that Ava tends to lie, but we don't know if she lied in this case. However, we do know that Elizabeth publicly claimed that the tangerine is in the blue crate, which we know is a lie. Therefore, we can assume that Elizabeth is also lying about the tangerine being in the red basket. + +This leaves us with the option of the tangerine being in the red bottle or the red pantry. Since there is no mention of the tangerine being moved to the red pantry, the answer is most likely the red bottle. + +Therefore, the answer is K. red bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..44f6cc41027c32d18ee4e16e3427ad37b763121e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. 
+15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Ava really think the tangerine is? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their interactions. According to the story, Owen, Logan, Elizabeth, Alexander, and Ava entered the front yard. Owen made no movements and stayed in the front yard for 1 minute before exiting. Logan moved the tangerine to the green box and then exited. Elizabeth moved the tangerine to the red basket and then exited. Alexander made no movements and stayed in the front yard for 1 minute before exiting. Ava made no movements and stayed in the front yard for 1 minute before exiting. + +Then, all five agents entered the waiting room. Elizabeth publicly claimed that the tangerine is in the blue crate, but Ava privately told Elizabeth that the tangerine is in the red basket. + +Based on this information, we can conclude that Ava knows the true location of the tangerine, and she told Elizabeth that it is in the red basket. 
Therefore, the answer is option O, red basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5058522945cd706b18928fb216a14878d48fc07 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Logan think Ava thinks the tangerine is? +Answer: green_box +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To answer this question, we need to track the movements of the tangerine and the agents' interactions. + +1. Owen, Logan, Elizabeth, Alexander, and Ava entered the front yard. +2. The tangerine is in the red bottle. +3. Owen made no movements and stayed in the front yard for 1 minute. +4. Owen exited the front yard. +5. Logan moved the tangerine to the green box. +6. Logan exited the front yard. +7. Elizabeth moved the tangerine to the red basket. +8. Elizabeth exited the front yard. +9. Alexander made no movements and stayed in the front yard for 1 minute. +10. Alexander exited the front yard. +11. Ava made no movements and stayed in the front yard for 1 minute. +12. Ava exited the front yard. +13. Owen, Logan, Elizabeth, Alexander, and Ava entered the waiting room. +14. Elizabeth publicly claimed that the tangerine is in the blue crate. +15. Ava privately told Elizabeth that the tangerine is in the red basket. + +Based on the story and assumptions, we know that Logan moved the tangerine to the green box and then exited the front yard. Logan did not have any interactions with Ava, so he does not know where Ava thinks the tangerine is. However, Ava privately told Elizabeth that the tangerine is in the red basket. Therefore, Ava thinks the tangerine is in the red basket. + +The answer to the question is O. red basket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9bd3abece56bc2d623250ba7da0cb90220081ed8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Owen think Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Owen think Logan thinks the tangerine is? +- We know that Owen did not move the tangerine and did not publicly claim where it is. +- Logan moved the tangerine to the green_box and then exited the front_yard. +- Therefore, Owen knows that Logan thinks the tangerine is in the green_box. + +2. Where does Ava think the tangerine is? +- We don't know for sure where Ava thinks the tangerine is, but we do know that she privately told Elizabeth that it is in the red_basket. + +3. Where does Owen think Ava thinks the tangerine is? +- To answer this question, we need to consider the exit order and the private communication between Ava and Elizabeth. +- Owen exited the front_yard before Ava, so he would tend to trust her more than Logan or Elizabeth. +- Ava privately told Elizabeth that the tangerine is in the red_basket, so Owen would know that Ava thinks it is there. +- Therefore, Owen thinks that Ava thinks the tangerine is in the red_basket. + +4. Where does Owen think Logan thinks Ava thinks the tangerine is? +- To answer this question, we need to combine the previous two answers. +- Owen thinks that Logan thinks the tangerine is in the green_box. +- Owen thinks that Ava thinks the tangerine is in the red_basket. +- Therefore, Owen thinks that Logan thinks Ava thinks the tangerine is NOT in the green_box (since Ava privately told Elizabeth that it is in the red_basket). + +Based on this analysis, the answer is NOT N. green_box. 
Therefore, we can eliminate options N, K, and L. We also know that Owen thinks the tangerine is NOT in the green_box, so we can eliminate options D and F. Finally, we know that Ava privately told Elizabeth that the tangerine is in the red_basket, so the answer must be O. red_basket. Therefore, the answer is O. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ef04a09daa45b7331bf033d6acabe82bce1ef7a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Elizabeth think Owen thinks Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. 
red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Elizabeth think the tangerine is? +- Elizabeth publicly claimed that the tangerine is in the blue_crate. + +2. Where does Ava think the tangerine is? +- Ava privately told Elizabeth that the tangerine is in the red_basket. + +3. Where does Elizabeth think Ava thinks the tangerine is? +- We don't have any information about this. Elizabeth may or may not trust Ava's claim, and we don't know if they had any private interactions that would give Elizabeth more information. + +4. Where does Logan think the tangerine is? +- Logan moved the tangerine to the green_box. We don't know if Logan made any public or private claims about the tangerine's location. + +5. Where does Owen think Logan thinks the tangerine is? +- Owen made no movements and stayed in the front_yard for 1 minute, so he didn't see where the tangerine was moved. We don't have any information about Owen's thoughts on the matter. + +6. Where does Elizabeth think Owen thinks Logan thinks the tangerine is? +- This is the key part of the question. We know that Elizabeth publicly claimed that the tangerine is in the blue_crate, but we don't know if she trusts her own claim or if she has any reason to doubt it. 
We also don't know if Owen and Logan had any private or public interactions that would give Elizabeth more information about their thoughts. However, we do know that Owen exited the front_yard before Logan moved the tangerine to the green_box, so Elizabeth may assume that Owen thinks the tangerine is still in the front_yard. Therefore, Elizabeth may think that Owen thinks Logan thinks the tangerine is in the green_box. + +Based on this analysis, the answer is N. green_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..298beca6639386bd883883ccee6c00ee10846386 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where is the onion really? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. 
blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To solve this question, we need to track the movements and statements of each agent regarding the onion's location. + +- Elizabeth moved the onion to the green_bucket. +- Owen moved the onion to the red_crate. +- Jack privately told Elizabeth that the onion is in the red_crate. +- Liam privately told Noah that the onion is in the green_bucket. + +From these statements, we can conclude that the onion is actually in the green_bucket, as Liam's statement to Noah confirms Elizabeth's action of moving the onion to the green_bucket. Jack's statement to Elizabeth is a lie, as he dislikes the tomato and may have wanted to mislead her. + +Therefore, the answer is E. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..810b9c3ee82611755642539d0a93a689a5763fa9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Owen really think the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To solve this question, we need to consider the movements and private interactions of the agents. According to the story, Owen moved the onion to the red_crate before exiting the cellar. 
However, we also know that Liam privately told Noah that the onion is in the green_bucket, and Jack privately told Elizabeth that the onion is in the red_crate. Since Owen did not have any private interactions with the other agents, he would only know where the onion is based on his own movements. Therefore, Owen really thinks the onion is in the red_crate, which is option A. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..046a5fb00fda2df185f335ec790f400401520122 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Elizabeth think Owen thinks the onion is? +Answer: green_bucket +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. 
blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Elizabeth and Owen regarding the onion. Elizabeth moved the onion to the green_bucket before exiting the cellar, while Owen moved the onion to the red_crate before exiting the cellar. Liam privately told Noah that the onion is in the green_bucket, and Jack privately told Elizabeth that the onion is in the red_crate. However, we cannot trust what Liam and Jack said, as all agents tend to lie. + +Based on the given assumptions, we know that Elizabeth can only infer Owen's thought if they have been in the same place or had private or public interactions. We also know that agents tend to trust a later-exiting agent. Since Owen exited the cellar after Elizabeth, she may trust his location of the onion more than Jack's claim. + +Therefore, Elizabeth may think that Owen thinks the onion is in the red_crate, as that is where he moved it before exiting the cellar. The answer is A. red_crate. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5de15ee978bf3a749274bdd4a3f7bca52c59cf02 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Liam think Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To answer this question, we need to track the movements and private interactions of Liam, Elizabeth, and Owen regarding the onion's location. + +- Liam made no movements in the cellar and exited after Noah. +- Elizabeth moved the onion from the red_crate to the green_bucket and exited before Owen. +- Owen moved the onion from the green_bucket to the red_crate and exited last. + +We also know that Liam privately told Noah that the onion is in the green_bucket, and Jack privately told Elizabeth that the onion is in the red_crate. + +Based on this information, we can infer that Liam knows the onion was in the green_bucket when he left the cellar. He also knows that Elizabeth was in the cellar before Owen, so she must have seen the onion in the green_bucket before it was moved to the red_crate. However, Liam cannot be sure what Owen thinks about the onion's location because he did not have any private interactions with Owen. + +Therefore, Liam thinks Elizabeth thinks Owen thinks the onion is in the green_bucket. The answer is E. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0295970e114568390e2cce3ae9d2fd5d76ff34b6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Noah think Liam thinks Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To solve this question, we need to track the movements and private interactions of the agents to determine where each agent thinks the onion is located. 
+ +- Noah made no movements and stayed in the cellar for 1 minute before exiting. He did not have any private interactions with Liam or Elizabeth. Therefore, we do not have any information about where he thinks the onion is located. + +- Liam made no movements and stayed in the cellar for 1 minute before exiting. He privately told Noah that the onion is in the green_bucket. Therefore, we know that Liam thinks the onion is in the green_bucket. + +- Elizabeth moved the onion to the green_bucket before exiting the cellar. She privately talked to Jack, who told her that the onion is in the red_crate. Therefore, we know that Elizabeth knows the onion is not in the green_bucket and thinks it is in the red_crate. + +- Owen moved the onion to the red_crate before exiting the cellar. We do not have any information about his private interactions or thoughts. + +Based on this information, we can determine that: + +- Liam thinks the onion is in the green_bucket. +- Elizabeth thinks the onion is in the red_crate. +- Owen's thoughts are unknown. +- Noah's thoughts are unknown. + +Therefore, the answer to the question is not determinable based on the given information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f07c887660ec6df75a4bd5941c558e7b067b30c7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. 
+6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where is the tangerine really? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their private conversations. According to the story, Benjamin moved the tangerine to the blue_pantry, but Elizabeth moved it back to the green_treasure_chest. Amelia privately told Mila that the tangerine is in the red_box, but we cannot trust her statement as the agents tend to lie. 
Chloe privately told Benjamin that the tangerine is in the green_treasure_chest, but again, we cannot trust her statement. Therefore, the only reliable information we have is that the tangerine was initially in the green_treasure_chest, and we know that Elizabeth moved it back there before leaving the attic. So, the answer is K. green_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1da90647aa5e8ead2f3f64121257b90f96c155cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Mila really think the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. 
green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To solve this question, we need to track the movements and private interactions of each agent. Mila entered the attic with the group, made no movements, and stayed for 1 minute before exiting. Chloe also made no movements and stayed for 1 minute before exiting. Amelia made no movements and stayed for 1 minute before exiting, but privately told Mila that the tangerine is in the red_box. Benjamin moved the tangerine to the blue_pantry before exiting, and Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. Elizabeth moved the tangerine to the green_treasure_chest before exiting. Mila, Chloe, Amelia, Benjamin, and Elizabeth then entered the waiting_room. + +Based on the assumptions given, we know that Mila can only infer the location of the tangerine based on her own observations and private interactions. She did not move or interact with the tangerine while in the attic, so she would not have known its location at that time. She did have a private interaction with Amelia, who told her that the tangerine is in the red_box. However, we do not know if Mila trusts Amelia or if she thinks Amelia is lying. We also do not know if Mila overheard Chloe telling Benjamin that the tangerine is in the green_treasure_chest. 
+ +Therefore, the answer to the question is N. red_box, as that is the only location that Mila has direct knowledge of through a private interaction. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..08f1f90b316edeaf54f2fae5937664b45047f6a2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Amelia think Mila thinks the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to track the movements and private interactions of Mila and Amelia. Mila did not move in the attic and exited first, while Amelia stayed in the attic for a minute before exiting. In the waiting room, Amelia privately told Mila that the tangerine is in the red_box. However, we need to determine where Amelia thinks Mila thinks the tangerine is. + +Based on the story, there is no indication that Mila shared her thoughts on the location of the tangerine with Amelia. Therefore, Amelia's assumption about Mila's thoughts on the tangerine's location is purely speculative. We cannot determine where Amelia thinks Mila thinks the tangerine is based on the given information. + +The answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..064421ab800b6dfa8f920f2f40e01bf97a30867b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. 
+3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Elizabeth think Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This question requires a bit of deduction and inference based on the given assumptions. We need to track the movements and private conversations of the agents to determine where Elizabeth thinks Amelia thinks Mila thinks the tangerine is. 
+ +First, we know that Benjamin was told by Chloe that the tangerine is in the green_treasure_chest. However, we cannot trust this information as Chloe may be lying. + +Next, Amelia privately told Mila that the tangerine is in the red_box. Again, we cannot trust this information as Amelia may be lying. + +We also know that Elizabeth moved the tangerine to the green_treasure_chest after Benjamin moved it to the blue_pantry. This suggests that Elizabeth may believe the tangerine is in the green_treasure_chest. + +Finally, we need to determine where Amelia thinks Mila thinks the tangerine is. We know that Amelia privately told Mila that the tangerine is in the red_box. However, we cannot trust this information as Amelia may be lying. Therefore, we cannot determine where Amelia thinks Mila thinks the tangerine is. + +Based on the given information, we can only conclude that Elizabeth thinks the tangerine is in the green_treasure_chest. Therefore, the answer is (K) green_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3aad9e19e8d5567d66cd81f98b1329d8ce39bea --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. 
+10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Chloe think Elizabeth thinks Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +2. Elizabeth moved the tangerine to the green_treasure_chest. +3. Amelia privately told Mila that the tangerine is in the red_box. +4. Chloe made no movements and stayed in the attic for 1 minute. +5. Chloe exited the attic later than Amelia and Benjamin. + +Based on assumption (4), Chloe trusts Benjamin more than Amelia. 
Therefore, Chloe believes that the tangerine is in the green_treasure_chest (from what Benjamin told her) and not in the red_box (from what Amelia told Mila). + +Now, we need to determine where Elizabeth thinks the tangerine is. Elizabeth moved the tangerine to the green_treasure_chest, so she definitely thinks it's there. We don't have any information about Elizabeth's thoughts on where the other characters think the tangerine is. + +Next, we need to determine where Amelia thinks the tangerine is. Amelia privately told Mila that the tangerine is in the red_box. We don't have any information about Amelia's thoughts on where the other characters think the tangerine is. + +Finally, we need to determine where Mila thinks the tangerine is. We don't have any direct information about Mila's thoughts on the location of the tangerine. However, we know that Mila was in the attic with the tangerine for one minute and made no movements. This could suggest that she was observing the tangerine and its location, but we can't be sure. + +Putting all of this together, we can conclude that Chloe thinks Elizabeth thinks Amelia thinks Mila thinks the tangerine is in the green_treasure_chest (option K). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..be6b42e9d1baa6febc48a76766f90eb5094a2ab0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. 
+6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To solve this question, we need to track the movements of the tangerine and the statements made by the agents. According to the story, the tangerine was initially in the red_basket (step 2). Sophia moved it to the green_bottle (step 5), and then Abigail moved it to the red_crate (step 9), and finally, Carter moved it back to the red_basket (step 11). Abigail publicly claimed that the tangerine is in the green_bottle (step 15), but we know that agents tend to lie. 
Carter privately told Ava that the tangerine is in the red_basket (step 16). + +Based on this information, we can conclude that the tangerine is actually in the red_basket, as confirmed by Carter's private statement to Ava. Therefore, the answer is option L. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d20b5ed004e86c2e2f91510e966dd910062ad81 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Amelia really think the tangerine is? +Answer: green_bottle +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to determine where Amelia was when the tangerine was moved and if she had any interactions with other agents who may have given her information about the tangerine's location. According to the story, Amelia stayed in the cellar for 1 minute and made no movements, so she did not move the tangerine herself. Sophia moved the tangerine to the green bottle and Abigail later claimed that the tangerine was in the green bottle. However, we do not know if Amelia was present when Abigail made this claim or if she had any private interactions with Carter who told Ava that the tangerine was in the red basket. Therefore, we cannot determine with certainty where Amelia thinks the tangerine is. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b02bc75018899e9e270c43a65ed6d8f33af7eea --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1,31 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. 
+2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Ava think Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of Ava and Amelia and the location of the tangerine. Ava entered the cellar with Sophia, Amelia, Abigail, and Carter. She made no movements and stayed in the cellar for 1 minute before exiting. 
Amelia also made no movements and stayed in the cellar for 1 minute before exiting. Sophia moved the tangerine from the red_basket to the green_bottle before exiting. Abigail moved the tangerine from the green_bottle to the red_crate before exiting. Finally, Carter moved the tangerine from the red_crate to the red_basket before exiting. + +We know that Ava dislikes corn, but we don't have any information about her thoughts on the tangerine's location. However, we do know that Carter privately told Ava that the tangerine is in the red_basket. Since Ava and Amelia were both in the cellar at the same time, Ava could infer Amelia's thoughts on the tangerine's location. + +Based on the movements of the tangerine and the agents, we know that the tangerine is in the red_basket, which is where Carter told Ava it was. Therefore, Ava would think that Amelia also thinks the tangerine is in the red_basket. + +The answer is L. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ae1f6c9a99d06cdf3cb67ba6c9dee213cf95769 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. 
+12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. We need to determine where Carter thinks the tangerine is. +2. We need to determine where Ava thinks the tangerine is. +3. We need to determine where Amelia thinks the tangerine is. +4. We need to determine where Carter thinks Ava thinks Amelia thinks the tangerine is. + +Step 1: Where does Carter think the tangerine is? +We know from the story that Carter privately told Ava that the tangerine is in the red_basket. Therefore, Carter thinks the tangerine is in the red_basket. + +Step 2: Where does Ava think the tangerine is? +We don't have any direct information about where Ava thinks the tangerine is. 
However, we do know that Ava dislikes the corn, which is not relevant to the question but is important to note. We also know that Ava made no movements in the cellar and exited before Sophia moved the tangerine to the green_bottle. Therefore, Ava could not have seen the tangerine in the green_bottle. We also know that Abigail publicly claimed that the tangerine is in the green_bottle, but we cannot assume that Ava believes this claim. Therefore, we cannot determine where Ava thinks the tangerine is. + +Step 3: Where does Amelia think the tangerine is? +We don't have any direct information about where Amelia thinks the tangerine is. We do know that Amelia made no movements in the cellar and exited before Abigail moved the tangerine to the red_crate. Therefore, Amelia could not have seen the tangerine in the red_crate. We also know that Abigail publicly claimed that the tangerine is in the green_bottle, but we cannot assume that Amelia believes this claim. Therefore, we cannot determine where Amelia thinks the tangerine is. + +Step 4: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Since we cannot determine where Ava and Amelia think the tangerine is, we cannot determine where Carter thinks they think the tangerine is. Therefore, we cannot answer the question. + +The answer is: Cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c5f226fbba243e0d833365b65496ec31f1d2806 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. 
+3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Abigail think Carter thinks Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. Abigail moved the tangerine to the red_crate and exited the cellar. +2. Carter privately told Ava that the tangerine is in the red_basket. +3. Ava dislikes the corn, so she wouldn't have moved the tangerine to the red_basket. +4. 
Therefore, Carter must have moved the tangerine to the red_basket after Abigail moved it to the red_crate. +5. Abigail publicly claimed that the tangerine is in the green_bottle, which we know is a lie based on step 2. +6. Abigail must be lying to throw off the other agents. +7. We need to figure out where Abigail thinks Carter thinks Ava thinks Amelia thinks the tangerine is. + +Based on the story, we know that Amelia made no movements and stayed in the cellar for 1 minute. Therefore, she couldn't have moved the tangerine to any of the locations listed in the answer choices. We also know that Sophia moved the tangerine to the green_bottle, but Abigail claimed that it was there, so we can't trust that information. + +The only two agents left are Ava and Carter. We know that Carter privately told Ava that the tangerine is in the red_basket, so we can assume that Ava knows where the tangerine is. However, we don't know if Ava shared this information with anyone else. + +Abigail is lying about the tangerine being in the green_bottle, so we can eliminate answer choices A, E, F, I, and K. We also know that the tangerine is not in the red_crate (where Abigail moved it) or the green_bottle (where Abigail claimed it was), so we can eliminate answer choices N and L. + +That leaves us with answer choices B, C, D, G, H, M, and O. We don't have any information to eliminate any of these choices, so we need to think about where Abigail might think the tangerine is based on her lies and the information she has. + +Abigail knows that the tangerine is not in the green_bottle (where she claimed it was), and she might suspect that it's not in the red_basket (since Ava knows where it is and might have told the other agents). Therefore, she might try to throw off the other agents by claiming that the tangerine is in a location that no one has mentioned yet. 
+ +Based on this reasoning, Abigail might think that Carter thinks Ava thinks Amelia thinks the tangerine is in the blue_crate, blue_bathtub, green_drawer, green_pantry, green_box, red_box, green_bucket, or blue_bucket. We can't be sure which one she thinks it is, but those are the only options left. + +Therefore, the answer is either B, C, D, G, H, M, or O. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f42f62618193986209cb5b4f07e3bcbefec49608 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where is the tomato really? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To solve this question, we need to follow the movements of the agents and their private interactions. + +1. Aiden and Isla entered the closet together. Aiden made no movements and stayed for 1 minute before exiting. Isla also made no movements and stayed for 1 minute before exiting. We don't know if they had any private interactions or not. + +2. Carter moved the tomato from the red_crate to the blue_container. We don't know if anyone saw him do this or not. + +3. Jack moved the tomato from the blue_container to the green_box. We don't know if anyone saw him do this or not. + +4. Evelyn moved the tomato from the green_box to the red_crate. We don't know if anyone saw her do this or not. + +5. All five agents entered the waiting_room together. Carter privately told Aiden that the tomato is in the green_box. Isla privately told Jack that the tomato is in the green_basket. We don't know if anyone else heard these private interactions or not. + +Based on this information, we can conclude that the tomato is in the green_box. This is because Carter told Aiden that the tomato is in the green_box, and Aiden would trust Carter because he exited the closet after Carter did. Additionally, Isla told Jack that the tomato is in the green_basket, but we don't have any reason to trust Isla's word since she could be lying. Therefore, the correct answer is M. green_box. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..27cfe91f8cc87a3213b08df855eabc44ce45733b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Jack really think the tomato is? +Answer: green_box +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their private interactions. We know that the tomato was initially in the red_crate, then moved to the blue_container by Carter, then to the green_box by Jack, and finally to the red_crate by Evelyn. Aiden and Isla made no movements and stayed in the closet for 1 minute each. + +After all the movements, Aiden, Isla, Carter, Jack, and Evelyn entered the waiting_room. Carter privately told Aiden that the tomato is in the green_box, and Isla privately told Jack that the tomato is in the green_basket. + +We need to determine where Jack really thinks the tomato is. We know that Jack moved the tomato to the green_box, so he knows that it was there at some point. However, we also know that Isla told Jack that the tomato is in the green_basket. Since Isla made no movements after entering the closet, she could not have moved the tomato to the green_basket. Therefore, Isla must be lying to Jack. + +Based on this, we can eliminate all options except for M (green_box) and O (green_basket). Since Isla lied to Jack, we cannot trust her claim that the tomato is in the green_basket. Therefore, Jack must believe that the tomato is in the green_box, making the answer M. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9771cfaa766e70f5445e480710cab2f50fbf524a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Isla think Jack thinks the tomato is? +Answer: green_basket +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: The question is asking where Isla thinks Jack thinks the tomato is. To answer this question, we need to follow the movements of Isla and Jack and their private conversation. 
+ +Step 1: Isla entered the closet with Aiden, Carter, Jack, and Evelyn. She made no movements and stayed in the closet for 1 minute before exiting. + +Step 2: Jack moved the tomato to the green_box and then exited the closet. + +Step 3: Isla privately told Jack that the tomato is in the green_basket. + +Based on the assumption that an agent can only infer another agent's thought if they have been in the same place or have had private or public interactions, we know that Isla knows that Jack moved the tomato to the green_box. However, we don't know if Jack told Isla where he moved the tomato. + +Since Isla privately told Jack that the tomato is in the green_basket, we can assume that Isla thinks Jack thinks the tomato is in the green_basket. Therefore, the answer is O. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c428481bda2d7cc758ff8ed3f67b71f3df36835 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. 
+15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Carter think Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: This question is asking for a complex inference based on the actions and private conversations of multiple characters. To solve it, we need to track the movements of each character and their private conversations, and use the assumptions provided to make logical deductions. + +First, we know that the tomato starts in the red_crate, but is moved several times by different characters. Carter moves it to the blue_container, Jack moves it to the green_box, and Evelyn moves it back to the red_crate. Isla and Aiden do not move the tomato. + +Next, we need to consider the private conversations between Carter and Aiden, and Isla and Jack. Carter tells Aiden that the tomato is in the green_box, while Isla tells Jack that the tomato is in the green_basket. + +Based on these conversations, we can make some inferences about what each character knows or believes about the location of the tomato. 
Carter knows that the tomato is not in the red_crate or blue_container, but believes it is in the green_box. Aiden knows that the tomato is not in the red_crate or green_box, but does not know where it is. Isla knows that the tomato is not in the red_crate or green_basket, but does not know where it is. Jack knows that the tomato is not in the red_crate or green_basket, but believes it is in the green_box. + +To answer the question, we need to determine where Carter thinks Isla thinks Jack thinks the tomato is. This requires us to consider Carter's beliefs about the tomato's location, as well as his trust in the other characters based on their exit order. + +We know that Carter exited the closet before Jack and Evelyn, but after Isla and Aiden. This means he would tend to trust Isla more than Aiden, but would trust Jack and Evelyn more than either of them. + +Based on Isla's private conversation with Jack, we know that she believes the tomato is in the green_box. However, we need to determine where Carter thinks Isla thinks Jack thinks the tomato is. + +Since Carter trusts Jack more than Isla, he would be more likely to believe Jack's claim about the tomato's location than Isla's. Therefore, we can conclude that Carter thinks Isla thinks Jack thinks the tomato is in the green_box (option M). + +The correct answer is M. green_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5896cffdc15aab2f1c9a3b0861a1279c7d14fa52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. 
+3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Aiden knows that the tomato was originally in the red_crate. +2. Aiden did not witness any movements of the tomato while he was in the closet. +3. Isla also did not witness any movements of the tomato while she was in the closet. +4. 
Carter moved the tomato from the red_crate to the blue_container. +5. Jack moved the tomato from the blue_container to the green_box. +6. Evelyn moved the tomato from the green_box to the red_crate. +7. Aiden, Isla, Carter, Jack, and Evelyn all exited the closet and entered the waiting_room. +8. Carter privately told Aiden that the tomato is in the green_box. +9. Isla privately told Jack that the tomato is in the green_basket. + +Based on this information, we can infer the following: + +- Aiden knows that the tomato was originally in the red_crate, but he does not know that it was moved to the blue_container and then to the green_box. +- Aiden trusts Carter because Carter exited the closet after him. +- Carter knows that the tomato is in the green_box because he moved it there and he told Aiden. +- Aiden does not know that Isla knows where the tomato is. +- Isla knows that the tomato is in the green_box because Jack moved it there and she told him. +- Aiden does not know that Jack knows where the tomato is. + +Now let's look at the question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? + +To answer this question, we need to work backwards from Jack to Carter to Isla to Aiden. Here's the thought process: + +- Jack knows that the tomato is in the green_box because Isla told him. +- Isla knows that the tomato is in the green_box because she saw Jack move it there. +- Aiden does not know that Isla knows where the tomato is, so he cannot assume that Isla thinks anything about the tomato's location. +- Carter knows that the tomato is in the green_box because he moved it there and he told Aiden. +- Aiden trusts Carter because he exited the closet after him. +- Therefore, Aiden thinks that Carter thinks the tomato is in the green_box. + +The answer is M. green_box. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fcafdc3e09fae0c0dcb7803ef040ef6ca46578fe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where is the green_pepper really? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of the green pepper and the private conversations between the agents. According to the story, Alexander moved the green pepper from the blue crate to the blue suitcase, and then Evelyn moved it from the blue suitcase to the blue treasure chest. Hannah, Abigail, and Noah made no movements and stayed in the den for one minute each. Then, all five agents entered the waiting room. + +In the waiting room, Evelyn privately told Abigail that the green pepper is in the green envelope, but we cannot trust this information as agents tend to lie. However, Hannah privately told Alexander that the green pepper is in the blue crate, which means that the green pepper is actually in the blue crate. + +Therefore, the answer to the question is G. blue crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7747e64d3ff89cc30953458c54be8b189902cb38 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. 
+5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Alexander really think the green_pepper is? +Answer: blue_crate +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to track the movements and private interactions of each agent. According to the story and assumptions, we know that Alexander moved the green_pepper to the blue_suitcase and then exited the den. Hannah made no movements and stayed in the den for 1 minute, and then exited. 
Abigail and Noah also made no movements and stayed in the den for 1 minute each before exiting. Evelyn moved the green_pepper to the blue_treasure_chest before exiting the den. Hannah privately told Alexander that the green_pepper is in the blue_crate, and Evelyn privately told Abigail that the green_pepper is in the green_envelope. + +Based on this information, we can eliminate options A, B, D, E, H, K, N, and O because there is no mention of these locations in the story. We can also eliminate option C because although Evelyn told Abigail that the green_pepper is in the green_envelope, we know from the story that Evelyn actually moved the green_pepper to the blue_treasure_chest. + +This leaves us with options F, G, I, J, and L. We know that Hannah told Alexander that the green_pepper is in the blue_crate, but we also know that Alexander moved the green_pepper to the blue_suitcase before leaving the den. Therefore, we cannot trust Hannah's information. + +We also know that Alexander likes the green_cupboard, but there is no mention of him thinking that the green_pepper is there. + +This leaves us with options G, I, J, and L. Since Alexander moved the green_pepper to the blue_suitcase before leaving the den, it is most likely that he thinks the green_pepper is in the blue_suitcase (option I). Therefore, the answer is I. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d848fdca140c475d65e0ebd6f130c0b92a85f190 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. 
+3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Evelyn think Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of the green pepper and the interactions between Evelyn and Alexander. + +According to the story, Alexander initially moved the green pepper from the green crate to the blue suitcase. 
Then, Evelyn moved the green pepper from the blue suitcase to the blue treasure chest. + +Later on, Hannah privately told Alexander that the green pepper is in the blue crate. However, we don't know if Alexander believed her or not. + +Evelyn privately told Abigail that the green pepper is in the green envelope. We don't know if Abigail believed her or not. + +We are asked where Evelyn thinks Alexander thinks the green pepper is. Based on the story, we don't have any direct information about what Evelyn thinks about Alexander's thoughts. However, we can make some inferences based on the assumptions given. + +Assumption (2) tells us that Evelyn can only infer Alexander's thoughts if they have been in the same place or have had private or public interactions. We know that they were both in the den at the same time, but we don't have any information about any private or public interactions they had. + +Assumption (4) tells us that agents tend to trust agents that exited the room later than themselves. We know that Alexander exited the den before Evelyn did, so based on this assumption, Evelyn may be less likely to trust Alexander's thoughts about the green pepper. + +Based on the movements of the green pepper, it seems that Evelyn may think that Alexander thinks the green pepper is in the blue suitcase (where he initially moved it to). However, we can't say for certain since we don't have any direct information about what Evelyn thinks about Alexander's thoughts. + +Therefore, the answer is I. blue suitcase. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..78129ac76c9f52e529ea504ca2fcc4e2e1027efb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? + +2. We know that Hannah privately told Alexander that the green_pepper is in the blue_crate. + +3. We also know that Evelyn privately told Abigail that the green_pepper is in the green_envelope. + +4. We need to determine where Hannah thinks Evelyn thinks Alexander thinks the green_pepper is. + +5. To do this, we need to consider the movements of each agent and their interactions. + +6. Alexander moved the green_pepper to the blue_suitcase before exiting the den. + +7. Evelyn then moved the green_pepper to the blue_treasure_chest before exiting the den. + +8. Hannah made no movements and stayed in the den for 1 minute before exiting. + +9. Abigail and Noah also made no movements and stayed in the den for 1 minute before exiting. + +10. Based on the assumption that agents tend to trust those who exit the room later than themselves, Hannah would trust Abigail and Noah more than Alexander and Evelyn. + +11. However, since Hannah did not witness Alexander moving the green_pepper to the blue_suitcase, she may not trust his movements as much as Abigail and Noah's lack of movements. + +12. Therefore, Hannah may think that Evelyn thinks Alexander thinks the green_pepper is in the blue_treasure_chest, since that is where Evelyn moved it to before exiting the den. + +13. 
The answer is J. blue_treasure_chest. + +So, the answer is J. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3aa193ea50b6c76bdca377a4481e67ec43eee4f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Abigail think Hannah thinks Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Abigail thinks that the green pepper is in the green envelope, based on what Evelyn told her. +2. Evelyn likes the green cupboard, but we don't know if she has any thoughts about where the green pepper is. +3. Hannah privately told Alexander that the green pepper is in the blue crate, but we don't know if she has any thoughts about where anyone else thinks the green pepper is. +4. Alexander moved the green pepper to the blue suitcase before he exited the den, so he doesn't think it's in the blue crate anymore. +5. Hannah made no movements in the den and stayed there for one minute, so she doesn't have any new information about the green pepper's location. +6. Abigail made no movements in the den and stayed there for one minute, so she doesn't have any new information about the green pepper's location. +7. Noah made no movements in the den and stayed there for one minute, so he doesn't have any new information about the green pepper's location. +8. Alexander, Evelyn, Hannah, Abigail, and Noah all entered the waiting room together, so they all know that the green pepper is not in the den anymore. +9. Based on the assumption that agents tend to trust agents who exited the room later than themselves, Abigail would trust Noah's opinion the most, followed by Hannah, then Evelyn, then Alexander. 
+ +Putting all of this together, we can conclude that Abigail thinks Hannah thinks that Evelyn thinks that the green pepper is in the green envelope. Therefore, the answer is F. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f482f6a5ca476d6f1b96ac64cfe7d7e2e82e4e21 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where is the cabbage really? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To solve this question, we need to track the movements of the cabbage and the statements made by the agents. According to the story, the cabbage was initially in the red_bucket in the master_bedroom. Logan moved it to the green_pantry and then Nathan moved it to the red_box. Isabella publicly claimed that the cabbage is in the red_box, but William privately told her that it is in the green_cupboard. However, we cannot trust what any agent says, so we need to rely on their movements. + +After the cabbage was moved to the red_box by Nathan, Isabella and Aiden stayed in the master_bedroom for a minute without making any movements. William also stayed in the master_bedroom for a minute without making any movements. Logan exited the master_bedroom before anyone else. + +Based on the assumption that an agent tends to trust an agent that exited the room later than himself, we can assume that William trusts Logan the most, followed by Aiden, Isabella, and Nathan. Therefore, we can eliminate any options that were not mentioned by Logan or William. + +Since Logan moved the cabbage to the green_pantry and William privately told Isabella that it is in the green_cupboard, we can conclude that the cabbage is most likely in the green_cupboard. Therefore, the answer is E. green_cupboard. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..45898b40d5b1094e15e1690bf604d3a086552696 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does William really think the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to follow William's movements and interactions with other agents. William lost his gloves in the master_bedroom and made no movements before exiting the room. In the waiting_room, he privately told Isabella that the cabbage is in the green_cupboard. Therefore, William thinks that the cabbage is in the green_cupboard. The answer is E. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..54d6a685ef06d004ee732ac2745e5a20a5992ed1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. 
+12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Nathan think William thinks the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Nathan and William regarding the cabbage. According to the story, Nathan moved the cabbage to the red_box and then exited the master_bedroom. William lost his gloves in the master_bedroom, made no movements for a minute, and then exited the master_bedroom. Later, in the waiting_room, Isabella publicly claimed that the cabbage is in the red_box, but William privately told Isabella that the cabbage is in the green_cupboard. 
+ +Based on these movements and interactions, we can infer that Nathan and William were both in the master_bedroom at the same time, but there is no evidence that they had any private or public interactions there. Therefore, Nathan cannot directly infer what William thinks about the cabbage. + +However, we know that William privately told Isabella that the cabbage is in the green_cupboard. Since Nathan exited the master_bedroom after William, he may trust William's word more than Isabella's public claim. Therefore, Nathan may think that William thinks the cabbage is in the green_cupboard. + +The correct answer is E. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..087a323647bf7812f90e82aa3944b89a8aeddf5a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. 
+16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Aiden think Nathan thinks William thinks the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. We need to determine who Aiden thinks Nathan thinks William thinks the cabbage is. This means we need to trace a chain of thoughts from Aiden to Nathan to William to the cabbage location. + +2. We know that Aiden lost his gloves and made no movements before exiting the master_bedroom. This means he did not move the cabbage or witness any movements by the other agents. + +3. Nathan moved the cabbage from the green_pantry to the red_box before exiting the master_bedroom. This means he knows the current location of the cabbage. + +4. William made no movements before exiting the master_bedroom, but he privately told Isabella that the cabbage is in the green_cupboard. 
This means he knows the actual location of the cabbage, but he may be lying to others. + +5. Based on the assumptions, Aiden can only infer William's thought if he has had a private interaction with him. However, there is no evidence that Aiden had a private interaction with William. + +6. Therefore, Aiden cannot know for sure where William thinks the cabbage is. He can only know where Nathan left the cabbage, which is in the red_box. + +7. Therefore, the answer is D. red_box. + +Note: It's important to carefully read and analyze the story and assumptions to determine what information is available and what can be inferred. It's also important to eliminate any distractors that do not have a clear connection to the question. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3673cf2ec9674adc30228a331c95ecc79634165 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. 
+15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +Answer: green_pantry +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Aiden think the cabbage is? +- We don't have any direct information about where Aiden thinks the cabbage is. We only know that he lost his gloves and made no movements before leaving the master bedroom. + +2. Where does Nathan think the cabbage is? +- Nathan moved the cabbage to the red box before leaving the master bedroom. +- Isabella publicly claimed that the cabbage is in the red box. +- William privately told Isabella that the cabbage is in the green cupboard. +- Based on this information, Nathan could believe that the cabbage is either in the red box or the green cupboard. + +3. Where does William think the cabbage is? 
+- William lost his gloves in the master bedroom. +- William privately told Isabella that the cabbage is in the green cupboard. +- Based on this information, William believes that the cabbage is in the green cupboard. + +4. Where does Nathan think William thinks the cabbage is? +- We don't have any direct information about what Nathan thinks William thinks about the cabbage's location. However, we know that Nathan exited the master bedroom after William, so he may be more likely to trust William's information. + +5. Where does Aiden think Nathan thinks William thinks the cabbage is? +- We don't have any direct information about what Aiden thinks about Nathan's or William's thoughts on the cabbage's location. However, we know that Aiden exited the master bedroom after Nathan, so he may be more likely to trust Nathan's information. + +6. Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +- Logan moved the cabbage to the green pantry before exiting the master bedroom. +- Based on this information, Logan believes that the cabbage is in the green pantry. +- We don't have any direct information about what Logan thinks about Aiden's, Nathan's, or William's thoughts on the cabbage's location. + +Putting it all together, we can conclude that Logan thinks Aiden thinks Nathan thinks the cabbage is either in the red box or the green cupboard. However, we cannot determine a specific answer choice from the given options. Therefore, the answer is not provided in the multiple-choice options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5d985a642b0af39b47f71c90250d356c6033df7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where is the green_pepper really? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their interactions. + +1. Abigail, Lily, Ella, Logan, and Elizabeth entered the den. +2. The green_pepper is in the red_drawer. +3. Abigail made no movements and stayed in the den for 1 minute. +4. Abigail exited the den. +5. Lily made no movements and stayed in the den for 1 minute. +6. Lily exited the den. +7. Ella made no movements and stayed in the den for 1 minute. +8. Ella exited the den. +9. Logan moved the green_pepper to the blue_crate. +10. Logan exited the den. +11. Elizabeth made no movements and stayed in the den for 1 minute. +12. Elizabeth exited the den. +13. Abigail, Lily, Ella, Logan, and Elizabeth entered the waiting_room. +14. Ella publicly claimed that green_pepper is in the red_pantry. +15. Elizabeth privately told Ella that the green_pepper is in the red_drawer. + +Based on the interactions, we know that Ella lied about the location of the green_pepper, as Elizabeth privately told her that it is in the red_drawer. We also know that Logan moved the green_pepper to the blue_crate. + +Therefore, the correct answer is D. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7c89765c611196ec57c6624dd2b69ec9632f7a6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Logan really think the green_pepper is? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to follow Logan's movements and interactions with other agents. Logan moved the green_pepper to the blue_crate and then exited the den. 
After that, Elizabeth privately told Ella that the green_pepper is in the red_drawer. However, we don't know if Logan overheard this conversation or not. Based on the given information, we can assume that Logan tends to lie like other agents. Therefore, we cannot trust his public claims. We also don't know if Logan had any private interactions with other agents. So, the only reliable information we have is that Logan moved the green_pepper to the blue_crate. Therefore, the answer is D. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dd25adedfec3cb1354f1fcf9ca0a4b8545469ef --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Lily think Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. 
green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Lily and Logan regarding the green_pepper. According to the story, Logan moved the green_pepper to the blue_crate before exiting the den. Lily made no movements in the den and exited after Logan. There is no mention of any private or public interactions between Lily and Logan regarding the green_pepper. Therefore, we cannot infer where Lily thinks Logan thinks the green_pepper is. The answer is not given in the story, so the correct answer is not listed among the options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..037dd3e12c9328c40dc36aeb4f1ce025b11f0910 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. 
+2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Ella think Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: The question is asking for Ella's belief about Lily's belief about Logan's belief about the location of the green pepper. To solve this question, we need to track the movements of each agent and their public and private claims. + +1. 
Abigail, Lily, Ella, Logan, and Elizabeth entered the den. +2. The green pepper is in the red drawer. +3. Abigail made no movements and stayed in the den for 1 minute. +4. Abigail exited the den. +5. Lily made no movements and stayed in the den for 1 minute. +6. Lily exited the den. +7. Ella made no movements and stayed in the den for 1 minute. +8. Ella exited the den. +9. Logan moved the green pepper to the blue crate. +10. Logan exited the den. +11. Elizabeth made no movements and stayed in the den for 1 minute. +12. Elizabeth exited the den. +13. Abigail, Lily, Ella, Logan, and Elizabeth entered the waiting room. +14. Ella publicly claimed that the green pepper is in the red pantry. +15. Elizabeth privately told Ella that the green pepper is in the red drawer. + +Based on the above information, we know that Logan moved the green pepper to the blue crate before exiting the den. However, we don't know if any of the other agents saw him do this or if they have any knowledge of the green pepper's location. + +Ella publicly claimed that the green pepper is in the red pantry, but we don't know if she actually believes this or if she is lying. Elizabeth privately told Ella that the green pepper is in the red drawer, so Ella knows the true location of the green pepper. + +We don't have any information about Lily's knowledge of the green pepper's location or her movements after exiting the den. Therefore, we cannot determine where Ella thinks Lily thinks Logan thinks the green pepper is. + +The answer is unknown. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..aea99ee3c6308ef7a37655854c8f84cdc0dc8d1c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Elizabeth think Ella thinks Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: This question requires a bit of logic and deduction. Let's break it down step by step: + +1. Elizabeth privately told Ella that the green_pepper is in the red_drawer. +2. Ella publicly claimed that green_pepper is in the red_pantry. +3. Lily made no movements and stayed in the den for 1 minute. +4. Logan moved the green_pepper to the blue_crate. + +Based on these steps, we can infer that Elizabeth knows the true location of the green_pepper (in the red_drawer) and that Ella is lying about its location (claiming it's in the red_pantry). We also know that Logan moved the green_pepper to the blue_crate, so we can eliminate any options that don't involve the blue_crate. + +Now we need to figure out where Elizabeth thinks Ella thinks Lily thinks Logan thinks the green_pepper is. Since Ella is lying about the location, we can't trust her claim that it's in the red_pantry. We also know that Lily didn't move the green_pepper, so she doesn't have any special knowledge about its location. That leaves us with Logan and his movement of the green_pepper to the blue_crate. + +Since Elizabeth knows the true location of the green_pepper and that Logan moved it to the blue_crate, she may assume that Ella is trying to throw others off the trail by claiming it's in the red_pantry. Therefore, Elizabeth may think that Ella thinks Logan thinks the green_pepper is in the blue_crate. + +So the answer is D. blue_crate. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a218d3702817b78d3008724c5b3c39ac097be44 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where is the lemon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To solve this question, we need to track the movements of the lemon and the private conversations between the agents. According to the story, Abigail moved the lemon from the blue_bathtub to the blue_treasure_chest, then Avery moved it to the blue_pantry, and finally Lily moved it back to the blue_bathtub. Liam privately told Noah that the lemon is in the blue_treasure_chest, but we know that Liam tends to lie. Avery privately told Abigail that the lemon is in the green_drawer, but we don't know if Avery is telling the truth or lying. Therefore, we cannot trust Avery's claim. Based on the movements of the lemon, the correct answer is A. blue_bathtub. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aebea79c0790164740f1dbc6f9010e16541c0e00 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. 
+10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Lily really think the lemon is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to follow Lily's movements with the lemon. According to the story, Lily moved the lemon to the blue bathtub (step 3), then later moved it to the blue pantry (step 12). We also know that Avery privately told Abigail that the lemon is in the green drawer (step 16), but we cannot assume that this is true since agents tend to lie. Therefore, Lily's actual thought about the lemon's location is either the blue bathtub or the blue pantry. The answer is A. blue_bathtub. 
+ +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..349dca2bd91c2b98194b0327b0d96ebb0a7eba9e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the lemon is? +Answer: blue_pantry +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the lemon and the agents' interactions. Here are the steps to solve the question: + +1. Abigail, Liam, Avery, Noah, and Lily entered the garage. +2. The lemon is in the blue_bathtub. +3. Abigail moved the lemon to the blue_treasure_chest. +4. Lily dislikes the cabbage. +5. Abigail exited the garage. +6. Liam made no movements and stayed in the garage for 1 minute. +7. Liam exited the garage. +8. Avery moved the lemon to the blue_pantry. +9. Avery exited the garage. +10. Noah made no movements and stayed in the garage for 1 minute. +11. Noah exited the garage. +12. Lily moved the lemon to the blue_bathtub. +13. Lily exited the garage. + +Based on the above steps, we know that Lily moved the lemon to the blue_bathtub before exiting the garage. However, we don't know if Avery witnessed this movement or not. We only know that Avery moved the lemon to the blue_pantry after Abigail moved it to the blue_treasure_chest. + +Next, we need to consider the private interaction between Avery and Abigail. Avery told Abigail that the lemon is in the green_drawer. However, we know that Avery moved the lemon to the blue_pantry, not the green_drawer. This means that Avery lied to Abigail. + +Since we don't have any information about Avery's private or public interactions with Lily, we cannot determine where Avery thinks Lily thinks the lemon is. Therefore, the answer is not provided in the given options. 
+ +a: 5 6 7 9 1 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6389af912e4cba2a55319e9a9148d64976d59739 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Liam think Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This question requires a bit of deduction and inference. We need to start with Liam's private conversation with Noah, where he tells him that the lemon is in the blue_treasure_chest. From this, we can infer that Liam knows where the lemon is. + +Next, we need to consider Avery's private conversation with Abigail, where he tells him that the lemon is in the green_drawer. We don't know if Avery is lying or telling the truth, but we do know that Liam was not present for this conversation, so he does not know where Avery thinks the lemon is. + +Finally, we need to consider where Lily thinks the lemon is. We know that Abigail moved the lemon to the blue_treasure_chest, but we don't know if Lily knows this. We also know that Avery moved the lemon to the blue_pantry, but we don't know if Lily knows this either. + +However, we do know that Lily moved the lemon to the blue_bathtub. We also know that Liam was present when Lily entered the garage and when she exited, so he knows that Lily moved the lemon to the blue_bathtub. + +Putting all of this together, we can infer that Liam thinks Avery thinks Lily thinks the lemon is in the blue_bathtub. Therefore, the answer is A. blue_bathtub. 
+ +a: 2 1 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9bd0d1a564b17ef825bad0f4167e78ca16903f4d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Noah think Liam thinks Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Noah thinks the lemon is in the blue_treasure_chest (according to Liam's private message to him). +2. Liam thinks the lemon is in the blue_treasure_chest (according to his private message to Noah). +3. Avery thinks the lemon is in the green_drawer (according to his private message to Abigail). +4. Abigail lost his watch and did not receive any private messages about the lemon's location. +5. Lily moved the lemon to the blue_bathtub, but we are not asked about her thoughts. + +So, we need to determine where Noah thinks Liam thinks Avery thinks the lemon is. Based on the information we have, we know that Liam thinks the lemon is in the blue_treasure_chest, and Avery thinks the lemon is in the green_drawer. However, we don't know where Liam thinks Avery thinks the lemon is. + +We can make some assumptions based on the given information. Since Liam did not move the lemon and stayed in the garage for 1 minute, he may not have seen Avery move the lemon to the blue_pantry. Therefore, he may still think the lemon is in the blue_treasure_chest. However, we cannot be certain. + +Noah, on the other hand, received a private message from Liam stating that the lemon is in the blue_treasure_chest. Therefore, he may also think that Avery thinks the lemon is in the blue_treasure_chest, since he has no reason to doubt Liam's message. + +Based on this analysis, the answer is E. blue_treasure_chest. 
+ +a: 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..070f6a9cc361ea5cee92d8ff3769421f67cc0e53 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where is the peach really? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements and private interactions of each agent. + +- Hannah made no movements in the patio and did not have any private interactions, so we can eliminate any answer choices that involve her. +- Liam moved the peach from the red_basket to the blue_treasure_chest and privately told Avery that the peach is in the red_bottle. However, we know that agents tend to lie, so we cannot trust Liam's claim to Avery. Therefore, we cannot eliminate any answer choices based on Liam's actions. +- Benjamin made no movements in the patio but privately told Hannah that the peach is in the red_envelope. Again, we cannot trust Benjamin's claim, so we cannot eliminate any answer choices based on his actions. +- Avery made no movements in the patio and did not have any private interactions, so we can eliminate any answer choices that involve her. +- Mila made no movements in the patio and did not have any private interactions, so we can eliminate any answer choices that involve her. + +Therefore, the only answer choice that remains is M. red_envelope. While we cannot trust Benjamin's claim, we also cannot eliminate it as a possibility. Liam's actions suggest that he moved the peach from the red_basket to the blue_treasure_chest, but we cannot be certain that this is where the peach actually is. Therefore, the only answer choice that we can confidently choose is M. red_envelope. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..54ea9bed2b213bf379cde0dd067473f2182b8f01 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Avery really think the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to consider the private conversation between Liam and Avery. Liam told Avery that the peach is in the red_bottle. However, we know that agents tend to lie, so we cannot trust Liam's statement. We also know that Avery made no movements and stayed in the patio for 1 minute, so she did not witness Liam moving the peach to the blue_treasure_chest. Therefore, we cannot assume that Avery knows the peach is in the blue_treasure_chest. + +However, we do know that Benjamin privately told Hannah that the peach is in the red_envelope. Since Avery and Benjamin were both in the patio at the same time, Avery could have overheard Benjamin's statement. Therefore, we can assume that Avery thinks the peach is in the red_envelope. + +The answer is M. red_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..781297bfb882a4bab6506a2ae76428e378318b85 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. 
+7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Liam think Avery thinks the peach is? +Answer: red_bottle +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: To answer this question, we need to track Liam's movements and private communication. Liam moved the peach to the blue_treasure_chest and privately told Avery that the peach is in the red_bottle. However, we don't know where Liam thinks Avery thinks the peach is. We only know that Liam told Avery that the peach is in the red_bottle. Therefore, the answer is N. red_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..33bc061341fbcbe4d30055cf90718abf783213d5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Benjamin think Liam thinks Avery thinks the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This question requires a bit of deduction and inference. Let's break it down step by step: + +1. Benjamin privately told Hannah that the peach is in the red_envelope. +2. Liam privately told Avery that the peach is in the red_bottle. +3. We need to figure out where Benjamin thinks Liam thinks Avery thinks the peach is. + +Based on the assumptions given, we know that Benjamin can only infer Liam's thoughts if they had a private interaction. We also know that agents tend to lie, so what Liam told Avery may not be true. However, we can use the information given to make some deductions. + +We know that Liam lost his gloves twice, which means he entered and exited the patio twice. We also know that Liam moved the peach from the red_basket to the blue_treasure_chest. This means that Liam had access to the peach and could have moved it again. + +Now, let's look at what Benjamin knows. He privately told Hannah that the peach is in the red_envelope. This means that he either saw the peach in the red_envelope or heard it from someone else. He also knows that Liam lost his gloves twice, so he may suspect that Liam moved the peach. + +Finally, we need to figure out where Avery thinks the peach is. According to Liam, Avery thinks the peach is in the red_bottle. However, we know that Liam may be lying. + +Putting all of this together, we can make an educated guess about where Benjamin thinks Liam thinks Avery thinks the peach is. Since Liam moved the peach from the red_basket to the blue_treasure_chest, Benjamin may suspect that Liam thinks the peach is in the blue_treasure_chest. 
However, since Liam told Avery that the peach is in the red_bottle, Benjamin may also suspect that Liam thinks Avery thinks the peach is in the red_bottle. + +Therefore, the answer is either O. blue_treasure_chest or N. red_bottle. We can't be sure which one is correct, but we can make an educated guess based on the information given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e04424c9eb1a33e34fd0adf4d3a425894fdc253e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +Answer: red_basket +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. 
red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Liam think the peach is? +- According to step 3, the peach is in the red_basket. +- However, in step 7, Liam moved the peach to the blue_treasure_chest. +- Finally, in step 16, Benjamin privately told Hannah that the peach is in the red_envelope. +- Since we know that agents tend to lie, we cannot trust what Benjamin told Hannah. Therefore, we can only rely on steps 3 and 7 to determine where Liam thinks the peach is. +- Liam initially thought the peach was in the red_basket, but then moved it to the blue_treasure_chest. Therefore, Liam thinks the peach is in the blue_treasure_chest. + +2. Where does Avery think the peach is? +- According to step 3, the peach is in the red_basket. +- However, in step 16, Benjamin privately told Hannah that the peach is in the red_envelope. +- Since we cannot trust what Benjamin told Hannah, we can only rely on step 3 to determine where Avery thinks the peach is. +- Avery thinks the peach is in the red_basket. + +3. Where does Liam think Avery thinks the peach is? +- According to step 16, Liam privately told Avery that the peach is in the red_bottle. 
+- However, we know that agents tend to lie, so we cannot trust what Liam told Avery. +- Since we already determined that Liam thinks the peach is in the blue_treasure_chest, we cannot use that information to determine where Liam thinks Avery thinks the peach is. +- Therefore, we cannot answer this part of the question. + +4. Where does Benjamin think Liam thinks Avery thinks the peach is? +- According to step 16, Benjamin privately told Hannah that the peach is in the red_envelope. +- Since we cannot trust what Benjamin told Hannah, we need to use other information to determine where Benjamin thinks Liam thinks Avery thinks the peach is. +- We know that Liam thinks the peach is in the blue_treasure_chest, and we know that Benjamin was in the same place as Liam before he exited the patio. +- Therefore, Benjamin would tend to trust Liam's opinion more than his own, since Liam exited the patio after Benjamin. +- Since we already determined that Avery thinks the peach is in the red_basket, and Liam thinks it's in the blue_treasure_chest, we need to determine where Benjamin thinks Liam thinks Avery thinks the peach is. +- Since Liam thinks the peach is in the blue_treasure_chest, and Avery thinks it's in the red_basket, Benjamin would tend to trust Liam's opinion more than Avery's. +- Therefore, Benjamin thinks that Liam thinks Avery thinks the peach is in the blue_treasure_chest. + +5. Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +- According to step 16, Benjamin privately told Hannah that the peach is in the red_envelope. +- Since we cannot trust what Benjamin told Hannah, we need to use other information to determine where Hannah thinks Benjamin thinks Liam thinks Avery thinks the peach is. +- We know that Benjamin thinks Liam thinks Avery thinks the peach is in the blue_treasure_chest. +- However, we need to determine where Hannah thinks Benjamin thinks this. 
+- We know that Hannah was in the same place as Benjamin before he exited the patio, so she would tend to trust his opinion more than her own. +- Therefore, Hannah thinks that Benjamin thinks Liam thinks Avery thinks the peach is in the blue_treasure_chest, even though she may not know where the peach actually is. + +Answer: O. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fbb3489013d4954c2495b5459637bd3e53974ed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where is the onion really? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: To solve this question, we need to track the movements of the onion and the agents. Emily moved the onion from the green_crate to the blue_pantry, and Liam moved it from the blue_pantry to the red_drawer. Avery, Elizabeth, and Lily made no movements and stayed in the hallway for one minute each. Then, Emily, Liam, Avery, Elizabeth, and Lily entered the waiting_room. Avery privately told Emily that the onion is in the blue_bottle, and Liam privately told Elizabeth that the onion is in the blue_treasure_chest. + +Based on the assumptions given, we know that the agents tend to lie, so we cannot trust what Avery and Liam said. We also know that the agents tend to trust an agent that exited the room later than themselves, so we can assume that Emily and Liam are more trustworthy than Avery, Elizabeth, and Lily. + +Therefore, the onion is most likely in the last place we saw it, which is the red_drawer. The correct answer is E. red_drawer. 
+ +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..818d4986e2826def93708d537dcd8e817e02e31e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1,30 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Lily really think the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: To answer this question, we need to track the movements of the onion and the agents' interactions. Emily moved the onion from the green_crate to the blue_pantry, and Liam moved it from the blue_pantry to the red_drawer. Avery, Elizabeth, and Lily made no movements and stayed in the hallway for one minute each. Then, all five agents entered the waiting_room. Avery privately told Emily that the onion is in the blue_bottle, and Liam privately told Elizabeth that the onion is in the blue_treasure_chest. + +Since Lily did not have any private or public interactions regarding the onion's location, we need to determine who she trusts the most based on the exit order. Lily exited the hallway last, so she would trust Emily's claim the most. Emily moved the onion to the blue_pantry, so Lily really thinks the onion is in the blue_pantry. + +Therefore, the answer is D. blue_pantry. + +a: 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a4f896d15feb4354aabe9b1e7fd9da2c453536b4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. 
+5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: To answer this question, we need to track Avery's movements and interactions with other agents. Avery entered the hallway with Emily, Liam, Elizabeth, and Lily. Avery made no movements and stayed in the hallway for 1 minute before exiting. Emily moved the onion from the green_crate to the blue_pantry before exiting. Liam then moved the onion from the blue_pantry to the red_drawer before exiting. 
+ +In the waiting_room, Avery privately told Emily that the onion is in the blue_bottle. This means that Avery knows the true location of the onion. However, we need to determine where Avery thinks Lily thinks the onion is. + +There is no indication that Avery had any private or public interactions with Lily. The only information we have about Lily is that she made no movements and stayed in the hallway for 1 minute before exiting. Therefore, we cannot determine where Avery thinks Lily thinks the onion is based on the given information. + +The answer is none of the above (not listed as an option). + +a: 1 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5481ddea85bf27f85c720a90450ec30d07773fd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. 
+Question: Where does Emily think Avery thinks Lily thinks the onion is? +Answer: blue_pantry +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: This question requires a bit of deduction and inference. Let's break it down step by step: + +1. Where does Emily think the onion is? +- Emily moved the onion to the blue_pantry, so she knows it's not in the green_crate, red_drawer, or any of the other options except for blue_pantry. + +2. Where does Avery think the onion is? +- Avery privately told Emily that the onion is in the blue_bottle, but we know that agents tend to lie. So we can't trust this information completely. +- Avery was in the hallway for 1 minute and made no movements, so she didn't see where the onion was moved to. +- However, Avery exited the hallway after Elizabeth and Lily, so she might trust their information more than her own observations. +- Elizabeth privately told Liam that the onion is in the blue_treasure_chest, but we know that agents tend to lie. So we can't trust this information completely either. 
+- Therefore, Avery might think the onion is in the blue_treasure_chest based on Elizabeth's claim. + +3. Where does Lily think the onion is? +- Lily made no movements and stayed in the hallway for 1 minute, so she didn't see where the onion was moved to. +- Lily exited the hallway after Elizabeth, so she might trust Elizabeth's information more than her own observations. +- Therefore, Lily might think the onion is in the blue_treasure_chest based on Elizabeth's claim. + +4. Where does Emily think Avery thinks Lily thinks the onion is? +- Emily knows that Avery might think the onion is in the blue_treasure_chest based on Elizabeth's claim. +- Emily doesn't have any information about where Lily thinks the onion is, but she knows that Lily might trust Elizabeth's information more than her own observations. +- Therefore, Emily might think that Avery thinks Lily thinks the onion is in the blue_treasure_chest. + +Answer: C. blue_treasure_chest + +a: 7 9 6 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..71da91f3630fd8ebf0b5abea368ba6e81ca9a773 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. 
+11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +Answer: blue_pantry +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Emily think the onion is? +- Emily moved the onion from the green_crate to the blue_pantry, so she knows it's not in the green_crate anymore. We don't know if she heard Avery's claim that it's in the blue_bottle, so we can't assume she thinks it's there. Therefore, Emily likely thinks the onion is in the blue_pantry. + +2. Where does Avery think Lily thinks the onion is? +- Avery made no movements and stayed in the hallway for 1 minute, so she didn't see where the onion was moved. 
However, she privately told Emily that the onion is in the blue_bottle. We don't know if Lily heard this claim, so we can't assume she thinks it's there. Therefore, we can't determine where Avery thinks Lily thinks the onion is. + +3. Where does Elizabeth think Liam thinks the onion is? +- Liam moved the onion from the blue_pantry to the red_drawer, so Elizabeth knows it's not in the blue_pantry anymore. Liam privately told Elizabeth that the onion is in the blue_treasure_chest, but we don't know if she trusts him or not. Therefore, Elizabeth likely thinks the onion is in the blue_treasure_chest, but she may have some doubt. + +4. Where does Lily think the onion is? +- Lily made no movements and stayed in the hallway for 1 minute, so she didn't see where the onion was moved. We don't know if she heard Avery's claim that it's in the blue_bottle, so we can't assume she thinks it's there. Therefore, we can't determine where Lily thinks the onion is. + +5. Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +- Based on our previous analysis, we know that Emily likely thinks the onion is in the blue_pantry and we can't determine where Avery thinks Lily thinks the onion is. However, Elizabeth knows that Liam privately told her that the onion is in the blue_treasure_chest. Since Elizabeth trusts Liam more than Avery (because he exited the hallway later), she may believe that the onion is actually in the blue_treasure_chest. Therefore, Elizabeth likely thinks that Emily thinks Avery thinks Lily thinks the onion is in the blue_treasure_chest. + +Answer: C. 
blue_treasure_chest + +a: 2 6 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a3c20a13e6ac753be462c4013a5e5cd0d2f5d80 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To solve this question, we need to track the movements and private interactions of each agent. According to the story, Jackson privately told Abigail that the cherry is in the green_bucket. However, we know that every agent tends to lie, so we cannot trust this information. We also know that Avery privately told Benjamin that the cherry is in the blue_crate. Since Avery exited the master_bedroom after Jackson, Benjamin can trust Avery more than Jackson. Therefore, we can assume that the cherry is in the blue_crate. The answer is option K. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..400a4c5cfbe8d9e029bc68b77620c47dbc433bbc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. 
+7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Jackson really think the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To solve this question, we need to follow the movements and private interactions of Jackson. According to the story, Jackson entered the master_bedroom with Benjamin, Avery, Abigail, and Mila. He made no movements and stayed in the room for 1 minute before exiting. Then, he entered the waiting_room with the others. 
+ +In the waiting_room, Avery privately told Benjamin that the cherry is in the blue_crate, but we don't know if Jackson overheard this conversation. However, we do know that Jackson privately told Abigail that the cherry is in the green_bucket. + +Based on assumption (3), we know that what Jackson tells Abigail doesn't necessarily reflect his actual thought. Therefore, we cannot conclude that Jackson really thinks the cherry is in the green_bucket. + +However, based on assumption (4), we know that Jackson tends to trust agents who exited the room later than himself. Since Abigail exited the master_bedroom after Jackson, he may be more likely to trust her. Therefore, we can infer that Jackson may think the cherry is in the green_bucket, which is what he told Abigail privately. + +Therefore, the answer is L. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c725ed713e985fa3970a1927ea161c4c7636a6e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. 
+11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Benjamin think Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements and private interactions of Benjamin and Jackson. We know that both Benjamin and Jackson entered the master_bedroom and stayed there for 1 minute without making any movements. Then, they both exited the room. After that, they both entered the waiting_room where Avery privately told Benjamin that the cherry is in the blue_crate and Jackson privately told Abigail that the cherry is in the green_bucket. + +Based on the assumption that an agent tends to trust an agent that exited the room later than himself, we can assume that Benjamin trusts Jackson more than Abigail. 
Therefore, Benjamin is more likely to believe Jackson's claim about the location of the cherry. + +According to Jackson's private claim, the cherry is in the green_bucket, which is option L. Therefore, the answer is L. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9376c5c957e423296330e065c3433c023308dd24 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1,32 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Mila think Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. 
green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: The question is asking about Mila's thoughts on Benjamin's thoughts on Jackson's thoughts about the location of the cherry. To solve this, we need to track the information given about the cherry's location and the private conversations between Avery and Benjamin, and Jackson and Abigail. + +From step 2, we know that the cherry is in the green_bucket. In step 15, Jackson tells Abigail that the cherry is in the green_bucket. However, we also know that every agent tends to lie, so we cannot trust Jackson's statement. + +In step 14, Avery privately tells Benjamin that the cherry is in the blue_crate. We cannot trust this statement either, but we can use it to infer Benjamin's thoughts. If Benjamin believed Avery's statement, he would think the cherry is in the blue_crate. However, if he did not believe Avery, he would still think the cherry is in the green_bucket. + +Mila was the last to exit the master_bedroom, so she would tend to trust the thoughts of agents who exited after her. Avery exited before Mila, so Mila would not trust Avery's statement about the cherry's location. However, Jackson exited after Mila, so she would tend to trust his thoughts more. 
+ +Therefore, Mila would think that Benjamin thinks Jackson thinks the cherry is in the green_bucket, since that is where the cherry actually is and Jackson's statement aligns with that. The answer is L. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f9eb0032dedd50e9a6c3e23e553a24b083481a5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Abigail think Mila thinks Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. 
green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Abigail thinks that the cherry is in the green_bucket, based on what Jackson told her. +2. Jackson told Abigail that the cherry is in the green_bucket, but we don't know if he is telling the truth or lying. +3. Benjamin did not make any movements in the master_bedroom, so he did not see where the cherry is. +4. Avery privately told Benjamin that the cherry is in the blue_crate, but we don't know if he is telling the truth or lying. +5. Mila did not make any movements in the master_bedroom, so she did not see where the cherry is. +6. Mila did not have any private or public interactions with Benjamin, so she does not know what he thinks about the cherry's location. +7. Abigail did not have any private or public interactions with Mila, so she does not know what Mila thinks about the cherry's location. +8. Abigail did not have any private or public interactions with Benjamin, so she does not know what he thinks about the cherry's location. +9. Jackson told Abigail that the cherry is in the green_bucket, but we don't know if he is telling the truth or lying. +10. Based on assumption (4), Abigail tends to trust agents who exited the room later than herself. 
Mila exited the master_bedroom after Abigail, so Abigail may be more likely to trust Mila's thoughts about the cherry's location. + +Putting all of this together, we can conclude that Abigail thinks Mila thinks Benjamin thinks the cherry is in the blue_crate (option K). This is based on the fact that Abigail trusts Mila's thoughts more than Benjamin's (since Mila exited the room after Abigail), and Avery told Benjamin that the cherry is in the blue_crate (although we don't know if this is true or false). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..565c6f764a98252073c6c51f250a506919a9a7bf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where is the asparagus really? +Answer: blue_drawer +Choices: A. 
green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their interactions. + +1. Elizabeth dislikes the orange. (This information is not relevant to the question.) + +2. Hannah, Emma, Elizabeth, Sophia, and Logan entered the garage. + +3. The asparagus is in the blue_drawer. + +4. Hannah made no movements and stayed in the garage for 1 minute. + +5. Hannah exited the garage. + +6. Emma made no movements and stayed in the garage for 1 minute. + +7. Emma exited the garage. + +8. Elizabeth made no movements and stayed in the garage for 1 minute. + +9. Elizabeth exited the garage. + +10. Sophia made no movements and stayed in the garage for 1 minute. + +11. Sophia exited the garage. + +12. Logan made no movements and stayed in the garage for 1 minute. + +13. Logan saw a dog. + +14. Logan exited the garage. + +15. Hannah, Emma, Elizabeth, Sophia, and Logan entered the waiting_room. + +16. Sophia publicly claimed that asparagus is in the red_crate. + +17. Logan privately told Hannah that the asparagus is in the blue_drawer. 
+ +Based on the assumption that agents tend to lie, we cannot trust Sophia's public claim that the asparagus is in the red_crate. However, we can trust Logan's private communication with Hannah that the asparagus is in the blue_drawer since they were in the same place and had a private interaction. Therefore, the answer is L. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0cc2d056df9b665b7202e076b4c817e039f11dfc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Logan really think the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. 
red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to look at the actions and interactions of Logan. According to the story, Logan saw a dog after staying in the garage for a minute and then exited the garage. Later, Logan privately told Hannah that the asparagus is in the blue_drawer. Therefore, Logan really thinks that the asparagus is in the blue_drawer. The answer is L. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..12a0229c91536a5e1fbd7b927d1b42789f2241c7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. 
+8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Sophia think Logan thinks the asparagus is? +Answer: red_crate +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Sophia and Logan. We know that Sophia publicly claimed that the asparagus is in the red_crate, but we also know that Logan privately told Hannah that the asparagus is in the blue_drawer. Since Logan saw a dog and exited the garage before Sophia made her claim, we can assume that Logan is the agent that Sophia trusts the most based on assumption (4). 
Therefore, Sophia likely thinks that Logan thinks the asparagus is in the blue_drawer, which is option L. So the answer is L. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b15611999cdd636aec3c8f7e74b852e2df246db9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Elizabeth think Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: This question requires a lot of attention to detail and inference. Let's break it down step by step: + +1. Where does Elizabeth think Sophia thinks the asparagus is? +We need to determine Elizabeth's belief about Sophia's belief about the location of the asparagus. + +2. What does Sophia publicly claim about the location of the asparagus? +We know from step 16 that Sophia publicly claimed that the asparagus is in the red_crate. + +3. Does Elizabeth trust Sophia's claim? +We don't know for sure, but we do know that Elizabeth dislikes the orange and has not made any movements in the garage. This information doesn't directly relate to the question, but it's important to keep in mind. + +4. What does Logan privately tell Hannah about the location of the asparagus? +We know from step 17 that Logan privately told Hannah that the asparagus is in the blue_drawer. + +5. Does Elizabeth trust Logan's claim? +We know from assumption (4) that Elizabeth is more likely to trust Logan's claim because he exited the garage after her. + +6. Where does Sophia think the asparagus is? +We don't know for sure, but we do know that she publicly claimed it's in the red_crate. It's possible that she actually believes this, or she could be lying. + +7. What does Elizabeth think Logan thinks about the location of the asparagus? 
+We don't know for sure, but we do know that Logan privately told Hannah it's in the blue_drawer. It's possible that Elizabeth believes this, or she could have a different belief. + +Putting all of this together, we can make an educated guess about the answer. Elizabeth trusts Logan's claim more than Sophia's claim, so it's likely that she believes the asparagus is in the blue_drawer. Sophia publicly claimed it's in the red_crate, but we don't know if she actually believes this or if she's lying. Therefore, we can't be sure what Elizabeth thinks Sophia thinks about the location of the asparagus. However, we do know that Elizabeth thinks Logan thinks it's in the blue_drawer. So the answer is L. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..826c72459f383d0475adf920681a7f74e077b3ff --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. 
+16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Hannah think Elizabeth thinks Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: This question requires a lot of inference based on the given assumptions. Let's break it down step by step: + +1. Hannah privately knows that the asparagus is in the blue_drawer (from Logan's private communication). +2. Elizabeth made no movements in the garage and therefore did not see the location of the asparagus. +3. Sophia publicly claimed that the asparagus is in the red_crate, but we know that agents tend to lie. +4. Logan saw a dog and therefore did not see the location of the asparagus. +5. Hannah exited the garage before Emma, Elizabeth, Sophia, and Logan, so she trusts their information less than her own knowledge of the asparagus location. +6. 
Therefore, Hannah thinks that Elizabeth thinks the asparagus is not in the red_crate (since Sophia's claim is public and therefore not trustworthy), but she does not know where Elizabeth thinks the asparagus is. +7. Since Hannah trusts her own knowledge of the asparagus location, she thinks that Sophia and Logan's thoughts on the location are not trustworthy. +8. Therefore, Hannah does not think that Elizabeth thinks Sophia or Logan's thoughts on the asparagus location are trustworthy. +9. We do not have any information on where Hannah thinks Elizabeth thinks the asparagus is, so the answer is unknown. + +Answer: Unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1ca42644107fc3762c03349fa2c8f5ba466255fb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where is the watermelon really? 
+Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To solve this question, we need to follow the movements of the watermelon and the private conversations between the agents. + +1. Owen moved the watermelon to the green_envelope. +2. Jacob moved the watermelon to the green_bucket. +3. Emma moved the watermelon to the blue_pantry. +4. William moved the watermelon to the green_basket. + +After all the agents exited the sunroom, Emma privately told Owen that the watermelon is in the green_bucket, and Jacob privately told William that the watermelon is in the green_envelope. + +We know that every agent tends to lie, so we cannot trust their public claims. However, we can use the exit order to determine who to trust. William exited the sunroom after Jacob, so we can trust his private conversation with Jacob. Therefore, we know that the watermelon is in the green_envelope. + +The answer is B. green_envelope. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b3673f3af21a8d31a40f1a65c83da382a625331 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does William really think the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to consider the private conversation between Jacob and William. Jacob told William that the watermelon is in the green_envelope, but we know from the story that Jacob moved the watermelon to the green_bucket before he left the sunroom. Therefore, Jacob lied to William about the location of the watermelon. We also know that Emma privately told Owen that the watermelon is in the green_bucket, which is the true location of the watermelon. Since William exited the sunroom after Jacob, he would tend to trust Jacob's claim less than Emma's claim. Therefore, William really thinks that the watermelon is in the green_bucket. The answer is D. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..08b15b26327422b635044b47b9d50ae333af6cf3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. 
+10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Carter think William thinks the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track the movements of the watermelon and the interactions between the agents. We know that Carter was in the sunroom with Owen, Jacob, Emma, and William. Carter made no movements and stayed in the sunroom for 1 minute before exiting. Owen, Jacob, Emma, William, and Carter then entered the waiting room. Emma privately told Owen that the watermelon is in the green_bucket, and Jacob privately told William that the watermelon is in the green_envelope. 
+ +Since Carter did not move the watermelon and did not have any private interactions with William, he only knows the public claims made by Emma and Jacob. We also know that agents tend to lie, so we cannot trust their public claims. However, we can use the exit order to determine who Carter might trust more. + +Carter exited the sunroom after William, so he might trust William's claim more than Emma's claim. Therefore, Carter might think that William thinks the watermelon is in the green_envelope, which is the location that Jacob told William. The answer is B. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..53032d696d02a16b58f03cced3c6c681b986ecd3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Owen think Carter thinks William thinks the watermelon is? 
+Answer: green_envelope +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To solve this question, we need to track the movements of the watermelon and the agents' interactions. + +First, Owen moved the watermelon from the green_crate to the green_envelope before exiting the sunroom. Then, Jacob moved the watermelon from the green_envelope to the green_bucket before exiting the sunroom. Emma moved the watermelon from the green_bucket to the blue_pantry before exiting the sunroom. Finally, William moved the watermelon from the blue_pantry to the green_basket before exiting the sunroom. + +After all the agents exited the sunroom, Emma privately told Owen that the watermelon is in the green_bucket, and Jacob privately told William that the watermelon is in the green_envelope. + +We need to determine where Owen thinks Carter thinks William thinks the watermelon is. Since Carter made no movements and stayed in the sunroom for 1 minute, he did not have any private interactions with any other agents. Therefore, Owen cannot infer Carter's thoughts directly. 
+ +However, Owen knows that Emma told him the truth about the watermelon being in the green_bucket. Since Emma exited the sunroom before William, Owen can trust William's claim about the watermelon being in the green_envelope. + +Therefore, Owen thinks that Carter thinks William thinks the watermelon is in the green_envelope. + +The answer is B. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..021164a42341df7b80dd45b76d5e431cf3c9173a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Emma think Owen thinks Carter thinks William thinks the watermelon is? +Answer: green_envelope +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. 
red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. Emma privately told Owen that the watermelon is in the green_bucket. +2. We need to find where Emma thinks Owen thinks Carter thinks William thinks the watermelon is. + +To solve this question, we need to work backwards. We know that Emma thinks the watermelon is in the green_bucket because she privately told Owen. We also know that Owen moved the watermelon to the green_envelope before he exited the sunroom. Therefore, Owen does not think the watermelon is in the green_bucket. + +Next, we need to figure out where Owen thinks Carter thinks the watermelon is. We know that Carter made no movements and stayed in the sunroom for 1 minute before he exited. Therefore, he does not know where the watermelon is. However, Owen trusts Carter because he exited the sunroom after him. Therefore, Owen might think that Carter knows where the watermelon is. + +Now, we need to figure out where Carter might think the watermelon is. Since he made no movements, he does not know where the watermelon is. However, he might trust William because William exited the sunroom after him. Therefore, Carter might think that William knows where the watermelon is. 
+ +Finally, we need to figure out where William thinks the watermelon is. We know that Jacob privately told William that the watermelon is in the green_envelope. However, we cannot trust Jacob's claim because he might be lying. Therefore, we need to look at the movements of the watermelon. We know that Owen moved the watermelon to the green_envelope before he exited the sunroom. Therefore, William might think that the watermelon is in the green_envelope. + +Putting it all together, Emma thinks that Owen thinks that Carter thinks that William thinks the watermelon is in the green_envelope. Therefore, the answer is B. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ce0b36e47372ff7f32288c282358bfd4ff4da4d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. 
+Question: Where is the tomato really? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To solve this question, we need to track the movements and statements of each agent regarding the tomato's location. + +- Emma saw a cat and made no movements in the study. +- Hannah made no movements in the study. +- Carter dislikes the banana and made no movements in the study. +- Liam moved the tomato to the green_drawer and then exited the study. +- Nathan made no movements in the study and publicly claimed that the tomato is in the blue_bottle. +- Carter privately told Emma that the tomato is in the green_drawer. + +Based on this information, we can eliminate some options. The tomato cannot be in the blue_bathtub, red_drawer, green_bathtub, green_envelope, blue_cupboard, green_box, blue_treasure_chest, red_bottle, green_pantry, green_bucket, or blue_drawer because there is no mention of these locations in the story. + +The tomato could be in the red_container or the green_drawer. Nathan publicly claimed that the tomato is in the blue_bottle, but we know that agents tend to lie. 
Carter privately told Emma that the tomato is in the green_drawer, but we don't know if Carter is telling the truth or lying. + +However, we can use the assumption that agents tend to trust agents who exited the room later than themselves. Liam exited the study after Carter, Nathan, Hannah, and Emma. Therefore, Liam is the last agent to exit the study and the other agents may trust him more. Liam moved the tomato to the green_drawer before exiting the study. Therefore, the tomato is most likely in the green_drawer. + +The answer is N. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..de2c73f5a827f803a686bbbd46cd7c0bf01128ab --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Emma really think the tomato is? +Answer: green_drawer +Choices: A. 
blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to look for any information related to Emma's thoughts about the location of the tomato. According to the story, Emma saw a cat and made no movements in the study for 1 minute before exiting. There is no information about Emma's thoughts or any interaction with other agents regarding the location of the tomato. Therefore, we cannot determine where Emma really thinks the tomato is based on the given information. The answer is not provided in the options given. The correct answer is "Cannot be determined." \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2caa550904891e8611b1a442b2aa2816e9cb55a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1,28 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Liam think Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: The question is asking about Liam's thoughts on where Emma thinks the tomato is. To answer this question, we need to track Emma's movements and interactions with other agents. 
Emma saw a cat and made no movements in the study for 1 minute before exiting. Therefore, she did not move the tomato to the green_drawer. Liam moved the tomato to the green_drawer and then exited the study. Nathan publicly claimed that the tomato is in the blue_bottle, but we know that Nathan tends to lie. Carter privately told Emma that the tomato is in the green_drawer, but we don't know if Emma believes him or not. + +Since Emma did not move the tomato and Liam moved it to the green_drawer, it is likely that Liam thinks Emma believes the tomato is in the green_drawer. Therefore, the answer is N. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..290dd2c9704dfab3b05825eebed24f2520eda2bc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. 
+Question: Where does Hannah think Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Hannah, Liam, and Emma regarding the tomato. + +- Emma saw the cat and made no movements in the study. +- Liam moved the tomato to the green_drawer and then exited the study. +- Hannah made no movements in the study. +- Nathan made no movements in the study. +- Carter made no movements in the study and privately told Emma that the tomato is in the green_drawer. + +Since Hannah made no movements in the study, she doesn't have any direct knowledge of where the tomato is. However, she knows that Liam moved the tomato to the green_drawer and that Carter told Emma that the tomato is in the green_drawer. + +Therefore, Hannah thinks that Liam thinks Emma thinks the tomato is in the green_drawer. + +The answer is N. green_drawer. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e8a6b220aa3e3332b75fbe64652182e2116bf885 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Carter think the tomato is? +According to the story, Carter privately told Emma that the tomato is in the green_drawer. Therefore, we know that Carter thinks the tomato is in the green_drawer. + +2. Where does Liam think the tomato is? +We know from the story that Liam moved the tomato to the green_drawer. Therefore, Liam thinks the tomato is in the green_drawer. + +3. Where does Hannah think Liam thinks the tomato is? +We don't have any direct information about where Hannah thinks the tomato is. However, we know that Hannah was in the study with Liam and saw him move the tomato to the green_drawer. Therefore, she has reason to believe that the tomato is in the green_drawer. We can assume that Hannah thinks Liam thinks the tomato is in the green_drawer. + +4. Where does Emma think Hannah thinks Liam thinks the tomato is? +We don't have any direct information about where Emma thinks the tomato is. However, we know that Emma saw a cat in the study and made no movements while she was there. Therefore, she did not see Liam move the tomato to the green_drawer. We can assume that Emma does not know where the tomato is and cannot make an informed guess about where Hannah thinks Liam thinks the tomato is. + +5. Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +This is the most complex part of the question. We know that Carter thinks the tomato is in the green_drawer and Liam thinks the tomato is in the green_drawer. 
We can assume that Hannah thinks Liam thinks the tomato is in the green_drawer. However, we don't have any direct information about what Emma thinks. Therefore, we cannot make an informed guess about what Hannah thinks Liam thinks Emma thinks. + +Based on this analysis, we can eliminate answer choices that are not related to the green_drawer: A, B, E, K, L, O. We can also eliminate answer choices that are not related to Hannah's thoughts: F, G, H, I, J, M. This leaves us with answer choice N, which is the green_drawer. Therefore, Carter thinks Hannah thinks Liam thinks Emma thinks the tomato is in the green_drawer. The answer is N. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fdd61b5fb2c0d75bb7146dbb2cdffcea36dbecb3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. 
+16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where is the lettuce really? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to follow the movements of each agent and their private interactions. According to the story, the lettuce was initially in the red_bucket in the living_room. Sophia moved it to the red_box before exiting the living_room. Isla and Benjamin made no movements and stayed in the living_room for 1 minute each before exiting. Alexander moved the lettuce to the red_pantry before exiting, and Emily moved it back to the red_bucket before exiting. Benjamin privately told Sophia that the lettuce is in the red_bucket, and Isla privately told Alexander that the lettuce is in the red_pantry. + +Based on this information, we can conclude that the lettuce is actually in the red_bucket, as confirmed by Benjamin's private communication with Sophia. Therefore, the correct answer is K. red_bucket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..324b1ad8b593c96516bdc3dd1127115acbce9a7c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Isla really think the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to look at the actions and private interactions of Isla. Isla made no movements in the living_room and stayed there for 1 minute. Isla then exited the living_room and privately told Alexander that the lettuce is in the red_pantry. Isla did not have any private interactions with Sophia or Benjamin, so we cannot infer their thoughts. However, we know that Isla trusts Alexander more than Benjamin because Alexander exited the living_room after Benjamin. Therefore, we can assume that Isla's private claim to Alexander is more likely to be truthful. Based on this information, the answer is L. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cadb38e293ca8fb025d78255332281ba47070c94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. 
+9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Benjamin think Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: The question is asking about Benjamin's thoughts about Isla's thoughts regarding the location of the lettuce. To answer this question, we need to look at the actions and interactions of Benjamin and Isla in the story. Isla privately told Alexander that the lettuce is in the red_pantry, but we don't know if Benjamin overheard this conversation. However, we do know that Benjamin privately told Sophia that the lettuce is in the red_bucket. Since Benjamin exited the living_room after Isla, he would trust Isla's information if he heard it. 
Therefore, Benjamin would think that Isla also believes the lettuce is in the red_pantry. The answer is L. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f25dbc8b681916e7f99e1de40a8da0a574a8e957 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Sophia think Benjamin thinks Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to track the movements and private interactions of Sophia, Benjamin, and Isla. + +1. Sophia moved the lettuce from the red_bucket to the red_box before leaving the living_room. +2. Isla made no movements and stayed in the living_room for 1 minute before leaving. +3. Benjamin made no movements and stayed in the living_room for 1 minute before leaving. +4. Alexander moved the lettuce from the red_box to the red_pantry before leaving. +5. Emily moved the lettuce from the red_pantry back to the red_bucket before leaving. +6. Benjamin privately told Sophia that the lettuce is in the red_bucket. +7. Isla privately told Alexander that the lettuce is in the red_pantry. + +Based on these movements and interactions, we know that Sophia knows the lettuce is in the red_bucket because she moved it there herself. Benjamin told Sophia that the lettuce is in the red_bucket, but we don't know if he actually believes that or if he's lying. Isla lost his phone and made no movements related to the lettuce. + +So, where does Sophia think Benjamin thinks Isla thinks the lettuce is? We don't have any direct information about what Benjamin thinks, but we can make some educated guesses based on the available information. + +If Benjamin is lying to Sophia about the lettuce being in the red_bucket, then Sophia might think that Benjamin thinks Isla knows the lettuce is actually in a different location. 
However, we don't have any information to suggest that Isla actually knows where the lettuce is. + +If Benjamin is telling the truth about the lettuce being in the red_bucket, then Sophia might think that Benjamin believes Isla also knows the lettuce is in the red_bucket. However, we don't have any information to suggest that Isla actually knows where the lettuce is. + +Overall, we don't have enough information to confidently answer this question. The best answer would be "insufficient information." \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..12fcadf2c29756fa5f54b71f258d45998d429766 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Emily think Sophia thinks Benjamin thinks Isla thinks the lettuce is? +Answer: red_box +Choices: A. 
blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: The question is asking about Emily's thoughts regarding the location of the lettuce according to the thoughts of Sophia, Benjamin, and Isla. To solve this, we need to track the movements and interactions of these agents. + +1. Sophia moved the lettuce to the red_box before exiting the living_room. +2. Isla made no movements and stayed in the living_room for 1 minute before exiting. +3. Benjamin made no movements and stayed in the living_room for 1 minute before exiting. +4. Alexander moved the lettuce to the red_pantry before exiting the living_room. +5. Emily moved the lettuce to the red_bucket before exiting the living_room. +6. Benjamin privately told Sophia that the lettuce is in the red_bucket. +7. Isla privately told Alexander that the lettuce is in the red_pantry. + +Based on these movements and interactions, we can infer the following: + +- Sophia knows that the lettuce was initially in the red_bucket, but she moved it to the red_box before leaving the living_room. +- Benjamin knows that the lettuce is in the red_bucket because Isla told him. 
+- Isla knows that the lettuce is in the red_pantry because Alexander told him. +- Alexander knows that the lettuce is in the red_pantry because he moved it there himself. +- Emily knows that the lettuce is in the red_bucket because she moved it there herself. + +Now we need to determine where Emily thinks Sophia thinks Benjamin thinks Isla thinks the lettuce is. + +- Emily knows that the lettuce is in the red_bucket. +- Sophia knows that the lettuce was initially in the red_bucket, but she moved it to the red_box. +- Benjamin knows that the lettuce is in the red_bucket because Isla told him. +- Isla knows that the lettuce is in the red_pantry because Alexander told him. + +Therefore, Emily thinks that Sophia thinks that Benjamin thinks that the lettuce is in the red_bucket. + +The answer is K. red_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e65877098e46e8d108eb7b12fe651f963cf7be2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. 
+15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where is the spinach really? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their public and private claims. According to the story and assumptions, we know that Abigail, Owen, Amelia, Jack, and Aiden all entered the laundry together. Abigail made no movements and stayed in the laundry for 1 minute before exiting. Owen moved the spinach from the blue suitcase to the red basket before exiting. Amelia made no movements and stayed in the laundry for 1 minute before exiting. Jack moved the spinach from the red basket to the green pantry before exiting. Aiden moved the spinach from the green pantry to the blue suitcase before exiting. + +After leaving the laundry, all five agents entered the waiting room. Amelia publicly claimed that the spinach is in the red container, but we know that agents tend to lie and what they say doesn't necessarily reflect their actual thoughts. 
Aiden privately told Amelia that the spinach is in the blue suitcase, which means that he knows where the spinach really is. + +Based on the movements of the agents, we can conclude that the spinach is in the blue suitcase (option F). Therefore, the answer is F. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..70775bff4c70dad4d31444ddc15f0f44e79a1230 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1,29 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Abigail really think the spinach is? +Answer: red_container +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track Abigail's movements and interactions with other agents. Abigail entered the laundry with Owen, Amelia, Jack, and Aiden. She made no movements and stayed in the laundry for 1 minute before exiting. During her time in the laundry, Owen moved the spinach to the red_basket, and Jack later moved it to the green_pantry. Abigail dislikes the lemon, but there is no mention of her having any interaction with the spinach. + +In the waiting_room, Amelia publicly claimed that the spinach is in the red_container, but Aiden privately told her that it is in the blue_suitcase. Abigail was present for both of these interactions, but there is no mention of her making any claims or having any private conversations about the spinach. + +Based on this information, we cannot determine where Abigail really thinks the spinach is. She did not interact with the spinach in the laundry, and there is no mention of her making any claims or having any private conversations about it in the waiting_room. Therefore, the answer is unknown and cannot be determined from the given information. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..da5c43fa72cc45019c5a7046ee9e764ff1fd3d34 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Owen think Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track where the spinach was moved by each agent and who had interactions with whom. + +- Abigail entered the laundry and made no movements, so she did not move the spinach. +- Owen moved the spinach from the blue suitcase to the red basket. +- Amelia entered the laundry and made no movements, so she did not move the spinach. +- Jack moved the spinach from the red basket to the green pantry. +- Aiden moved the spinach from the green pantry to the blue suitcase. + +After all the agents exited the laundry, Amelia publicly claimed that the spinach is in the red container, but Aiden privately told Amelia that the spinach is in the blue suitcase. + +Since Owen moved the spinach to the red basket and did not have any interactions with Abigail, we cannot determine where Owen thinks Abigail thinks the spinach is based on the given information. Therefore, the answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c62a7bddc4ea093069a31c6f7bad4d39e599812 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. 
+3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Aiden think Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions. + +1. Abigail, Owen, Amelia, Jack, and Aiden entered the laundry. +2. The spinach is in the blue_suitcase. +3. Abigail made no movements and stayed in the laundry for 1 minute. +4. Abigail exited the laundry. +5. 
Owen moved the spinach to the red_basket. +6. Owen exited the laundry. +7. Amelia made no movements and stayed in the laundry for 1 minute. +8. Amelia exited the laundry. +9. Jack moved the spinach to the green_pantry. +10. Abigail dislikes the lemon. +11. Jack exited the laundry. +12. Aiden moved the spinach to the blue_suitcase. +13. Aiden exited the laundry. +14. Abigail, Owen, Amelia, Jack, and Aiden entered the waiting_room. +15. Amelia publicly claimed that spinach is in the red_container. +16. Aiden privately told Amelia that the spinach is in the blue_suitcase. + +Based on the assumption that agents tend to trust those who exited the room later than themselves, we know that Aiden trusts Amelia's claim that the spinach is in the red_container. However, we need to determine where Aiden thinks Owen thinks Abigail thinks the spinach is. + +We know that Owen moved the spinach to the red_basket, but we don't know if he shared this information with anyone. Abigail made no movements and dislikes lemon, so we can assume she doesn't know where the spinach is. Jack moved the spinach to the green_pantry, so he knows where it is, but we don't know if he shared this information with anyone. + +Therefore, the only information we have to go on is that the spinach is in the blue_suitcase, which Aiden knows. We also know that Aiden privately told Amelia this information. + +So, where does Aiden think Owen thinks Abigail thinks the spinach is? We don't have enough information to determine this. The answer cannot be determined from the given information. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5d3611308b2fb06074b6a0dc83aa8f045749c93 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Jack think Aiden thinks Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires breaking down the thought process of each character. + +First, we need to determine where the spinach actually is. According to the story, Aiden moved the spinach to the blue suitcase. + +Next, we need to determine who knows where the spinach is. Aiden privately told Amelia that the spinach is in the blue suitcase. Amelia publicly claimed that the spinach is in the red container. This means that Amelia is lying about the location of the spinach. + +Now, we need to determine what each character thinks about the location of the spinach. Abigail made no movements and stayed in the laundry for 1 minute, so we don't know what she thinks. Owen moved the spinach to the red basket, so he knows that it's not in the blue suitcase. Jack moved the spinach to the green pantry, so he also knows that it's not in the blue suitcase. + +Finally, we need to determine where Jack thinks Aiden thinks Owen thinks Abigail thinks the spinach is. Since Jack knows that the spinach is not in the blue suitcase, he knows that Aiden must also know this. Therefore, Aiden cannot think that Abigail thinks the spinach is in the blue suitcase. Owen moved the spinach to the red basket, so he knows that it's not in the blue suitcase. Therefore, Owen cannot think that Abigail thinks the spinach is in the blue suitcase. Abigail made no movements, so we don't know what she thinks. Therefore, Jack must think that Aiden thinks that Abigail thinks the spinach is in the blue suitcase. + +The answer is F. blue suitcase. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..197873fe3d2537ff20aca9b5a90d0867b3afecaf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where is the persimmon really? +Answer: green_drawer +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. 
green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track the movements of the persimmon and the agents. According to the story, the persimmon was initially in the blue_pantry (statement 2). Aiden moved it to the green_treasure_chest (statement 7), and then Amelia moved it to the blue_pantry (statement 11) before finally moving it to the green_drawer (statement 18). + +Ella publicly claimed that the persimmon is in the blue_bottle (statement 26), but we know that the agents tend to lie (assumption 3). Additionally, Amelia privately told Ella that the persimmon is in the red_box (statement 27). + +Based on the movements of the persimmon and the private conversation between Amelia and Ella, we can conclude that the persimmon is actually in the red_box (statement 27) and not in the blue_bottle as claimed by Ella. Therefore, the answer is H. red_box. 
+ +a: 5 7 6 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cd441c244c0fc0e06882c54474ac05c3fb6a7d79 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Owen really think the persimmon is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. 
blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: To answer this question, we need to look at the movements and interactions of Owen and other agents related to the persimmon. According to the story, Owen made no movements in the closet and stayed there for 1 minute before exiting. Aiden moved the persimmon from the blue_pantry to the green_treasure_chest before exiting the closet. Amelia moved the persimmon from the blue_pantry to the green_drawer before exiting the closet. Ella publicly claimed that the persimmon is in the blue_bottle, but Amelia privately told Ella that the persimmon is in the red_box. + +Based on these movements and interactions, we can eliminate some options. Owen did not move the persimmon, so options A, C, E, L, and O can be eliminated. There is no mention of Owen interacting with Ella or Amelia, so options B, D, K, M, and N can also be eliminated. + +That leaves us with two options: green_drawer and red_box. Amelia moved the persimmon to the green_drawer, but she also told Ella that the persimmon is in the red_box. Since Owen exited the closet after Aiden and before Amelia, he may be more likely to trust Amelia's private claim over Ella's public claim. 
Therefore, Owen may really think that the persimmon is in the red_box. + +The answer is H. red_box. + +a: 5 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..09de6be34879da4cee6b0979b6907a1aed57190a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Amelia think Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. 
green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To answer this question, we need to track where the persimmon has been moved throughout the story and who has interacted with it. From the story, we know that the persimmon was initially in the blue_pantry, then moved to the green_treasure_chest by Aiden, then to the blue_pantry by Amelia, and finally to the green_drawer by Amelia. + +We also know that Owen made no movements and stayed in the closet for 1 minute, so he did not interact with the persimmon. Therefore, Amelia would not have any information about where Owen thinks the persimmon is based on her interactions with it. + +The answer is none of the above, as Amelia does not have any information about where Owen thinks the persimmon is. 
+ +a: 5 6 7 4 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1d70bac687f4690bcb77bfb48a149eecc4262bd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Aiden think Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. 
green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: First, we need to determine where Amelia thinks the persimmon is. According to assumption (2), Aiden can only infer Amelia's thought if they have been in the same place or had a private interaction. From the story, we know that Amelia moved the persimmon to the green_drawer (step 18) and privately told Ella that the persimmon is in the red_box (step 27). Therefore, we can conclude that Amelia thinks the persimmon is in the red_box. + +Next, we need to determine where Owen thinks the persimmon is. We don't have any direct information about Owen's thoughts, but we can use assumption (4) to make an inference. Since Owen exited the closet before Aiden, Aiden is more likely to trust Owen's judgment. From step 5, we know that Owen made no movements and stayed in the closet for 1 minute. Therefore, we can assume that Owen did not see the persimmon being moved and still thinks it is in the blue_pantry (step 2). + +Finally, we can answer the question. Aiden thinks that Amelia thinks Owen thinks the persimmon is in the blue_pantry (answer choice G), since Owen has not seen the persimmon being moved and Aiden knows that Amelia thinks it is in the red_box. 
+ +a: 4 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..db4c61b2540a4535656cfb1e6e9aad269266a274 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1,78 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Ella think Aiden thinks Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. 
red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Ella publicly claimed that persimmon is in the blue_bottle. This means that Ella thinks the persimmon is in the blue_bottle. + +2. Amelia privately told Ella that the persimmon is in the red_box. This means that Ella knows that Amelia thinks the persimmon is in the red_box. + +3. Aiden saw a monkey. This doesn't seem relevant to the question, so we can ignore it. + +4. Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. This means that all five agents were in the waiting_room at the same time. + +5. Amelia, Aiden and Ella entered the closet. This means that Amelia, Aiden, and Ella were in the closet at the same time. + +6. The persimmon is in the blue_pantry. This means that the persimmon was in the blue_pantry at some point, but we don't know if it's still there. + +7. Amelia moved the persimmon to the green_drawer. This means that Amelia moved the persimmon from wherever it was to the green_drawer. + +8. Aiden moved the persimmon to the green_treasure_chest. 
This means that Aiden moved the persimmon from the green_drawer to the green_treasure_chest. + +9. Amelia, Aiden and Ella entered the waiting_room. This means that all three agents were in the waiting_room at the same time. + +Based on these steps, we can start to piece together where Ella thinks Aiden thinks Amelia thinks Owen thinks the persimmon is. We know that Ella thinks the persimmon is in the blue_bottle, and that Amelia thinks the persimmon is in the red_box. We also know that Aiden moved the persimmon from the green_drawer to the green_treasure_chest, but we don't know where he thinks the persimmon is. + +To figure out where Ella thinks Aiden thinks Amelia thinks Owen thinks the persimmon is, we need to look for clues about Owen's thoughts. Unfortunately, there are no direct clues about Owen's thoughts in the story. However, we do know that Aiden exited the closet before Ella, and that Ella made no movements and stayed in the closet for 1 minute before exiting. This means that Ella would tend to trust Aiden's thoughts more than her own, and that Aiden would tend to trust his own thoughts more than Ella's. + +Given this information, we can make an educated guess about where Ella thinks Aiden thinks Amelia thinks Owen thinks the persimmon is. Since Ella thinks the persimmon is in the blue_bottle, and Aiden would tend to trust his own thoughts more than Ella's, it's likely that Aiden also thinks the persimmon is in the blue_bottle. Since Amelia thinks the persimmon is in the red_box, and Aiden would tend to trust his own thoughts more than Amelia's, it's likely that Aiden doesn't think the persimmon is in the red_box. 
This leaves us with the following options: + +- green_bathtub +- green_basket +- red_bottle +- red_container +- green_drawer +- blue_pantry +- red_box +- green_treasure_chest +- red_bucket +- green_pantry +- red_crate +- blue_cupboard +- green_bucket + +Of these options, the only one that matches both Ella's and Aiden's thoughts is the red_bottle. Therefore, we can conclude that Ella thinks Aiden thinks Amelia thinks Owen thinks the persimmon is in the red_bottle. The answer is D. + +a: 4 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df9f07efe7d3859aa6bb33fc2efb6e16f359bbcc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. 
+20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where is the persimmon really? +Answer: green_pantry +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of each agent and the location of the persimmon. According to the story, the persimmon was initially in the blue_crate when all five agents entered the bathroom. Charlotte moved it to the red_crate, then Evelyn moved it to the blue_cupboard, and finally, Amelia moved it to the green_pantry. Therefore, the persimmon is in the green_pantry. The answer is K. green_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b036a525d8c57afb1716e6bdc22a785f5273785 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Ava really think the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. 
green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track Ava's movements and the movements of the persimmon. According to the story, Ava did not move the persimmon, but Charlotte, Evelyn, and Amelia did. Benjamin also did not move the persimmon. After all the agents exited the bathroom, they entered the waiting room and then the office. In the office, Ava moved the onion to the green_box, and Benjamin and Evelyn were also present. Benjamin privately told Evelyn that the onion is in the red_container, and Evelyn privately told Amelia that the onion is in the green_box. + +Based on the assumptions given, we know that Ava may not be telling the truth about where she thinks the persimmon is. However, we can infer that she may trust Benjamin's claim about the onion being in the red_container since he exited the office after her. Therefore, Ava may think that the persimmon is in the red_crate, which is the option (N) in the multiple-choice question. + +So the answer is (N) red_crate. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2b93c6df85945aafcb941d6f3eb11d576a593dd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Evelyn think Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. 
green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of the agents and their private and public interactions. We know that Ava did not move the persimmon, but Charlotte, Evelyn, and Amelia did. Benjamin did not move anything. Ava, Benjamin, and Evelyn entered the office together, but only Benjamin stayed there for a minute. Then, Benjamin and Evelyn exited the office together. Later, Benjamin privately told Evelyn that the onion is in the red_container, and Evelyn privately told Amelia that the onion is in the green_box. + +Based on these movements and interactions, we can infer that Evelyn trusts Benjamin more than Ava because Benjamin exited the office after her. Therefore, she may believe Benjamin's claim about the onion's location more than Ava's claim about the persimmon's location. We also know that Charlotte moved the persimmon to the red_crate, and Evelyn moved it to the blue_cupboard. Since Evelyn was the last one to move the persimmon and she exited the bathroom before Amelia, she may think that Ava thinks the persimmon is in the blue_cupboard, which is where she left it. + +Therefore, the answer is M. blue_cupboard. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..91c9c6d052cdfe6b88c5d21c36b65c6b2c8be0ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Charlotte think Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. 
green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. We need to track the movements of each agent and their interactions with each other to determine where Charlotte thinks Evelyn thinks Ava thinks the persimmon is. + +First, we know that Ava did not move the persimmon and left the bathroom before anyone else. Therefore, she has no idea where the persimmon is. + +Next, Charlotte moved the persimmon to the red_crate before leaving the bathroom. So, she knows that the persimmon is not in the blue_crate anymore. + +Evelyn then moved the persimmon to the blue_cupboard before leaving the bathroom. She knows that the persimmon is not in the red_crate anymore. + +Amelia then moved the persimmon to the green_pantry before leaving the bathroom. She knows that the persimmon is not in the blue_cupboard anymore. + +Finally, Benjamin did not move the persimmon and left the bathroom after everyone else. He knows that the persimmon is not in the green_pantry anymore. + +In the office, Ava moved the onion to the green_box before leaving. Benjamin and Evelyn did not move the onion and left after Ava. 
Benjamin privately told Evelyn that the onion is in the red_container, but Evelyn privately told Amelia that the onion is in the green_box. + +Based on this information, we can deduce that Charlotte thinks that Evelyn thinks that Ava thinks the persimmon is in the green_box. + +Therefore, the answer is A. green_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7cca1ed10a05d89b2477c6feb0b3b6aab51b99c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. 
+24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Benjamin think Charlotte thinks Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. We need to trace the path of the persimmon and the agents' movements to determine where Benjamin thinks Charlotte thinks Evelyn thinks Ava thinks the persimmon is. + +First, we know that the persimmon starts in the blue_crate and is moved by Charlotte to the red_crate, then by Evelyn to the blue_cupboard, and finally by Amelia to the green_pantry. Ava does not move the persimmon. + +Next, we know that Ava moves the onion from the blue_bathtub to the green_box, and tells no one where she put it. Benjamin privately tells Evelyn that the onion is in the red_container, but we don't know if he is telling the truth or lying. Evelyn privately tells Amelia that the onion is in the green_box. 
+ +Based on the assumption that agents tend to trust those who exit a room later than themselves, we can assume that Benjamin trusts Evelyn more than Charlotte or Ava. Therefore, he is more likely to believe Evelyn's claim about the onion's location. + +However, we are not asked about the onion's location. We are asked about the persimmon's location. We need to determine where Benjamin thinks Charlotte thinks Evelyn thinks Ava thinks the persimmon is. + +We know that Charlotte moved the persimmon from the blue_crate to the red_crate, but we don't know if she told anyone where she put it. Evelyn moved the persimmon from the red_crate to the blue_cupboard, but we don't know if she told anyone where she put it. Amelia moved the persimmon from the blue_cupboard to the green_pantry, but we don't know if she told anyone where she put it. + +Therefore, we cannot determine where Benjamin thinks Charlotte thinks Evelyn thinks Ava thinks the persimmon is. The answer is not given in the story and cannot be deduced based on the information provided. + +The correct answer is not listed among the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c8a78b0ff285fcc9110c72d2e02516f5691f063 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. 
+8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where is the grapes really? +Answer: blue_pantry +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_pantry +GPT-4 Explain: To solve this question, we need to track the movements of the grapes and the statements made by the agents. According to the story, the grapes were initially in the blue_pantry (Step 2), then Benjamin moved them to the blue_suitcase (Step 3), and later Alexander moved them to the red_crate (Step 11), and finally, Owen moved them to the blue_pantry (Step 13). + +Now, we need to consider the statements made by the agents. Benjamin publicly claimed that the watermelon is in the green_pantry (Step 27), but we cannot trust his statement as he tends to lie. Owen privately told Benjamin that the watermelon is in the red_pantry (Step 29), but this statement does not provide any information about the location of the grapes. Liam likes the red_bucket (Step 15), but this statement is also irrelevant to the location of the grapes. + +Alexander lost his gloves (Step 7) and made no movements in the garage (Steps 22-23), so his actions do not provide any information about the location of the grapes. Elizabeth made no movements and stayed in the workshop for 1 minute (Step 8-9), so her actions are also irrelevant. + +Finally, we need to consider the exit order of the agents. Benjamin exited the workshop first (Step 4), followed by Liam (Step 6), Elizabeth (Step 9), Alexander (Step 23), and Owen (Step 21). Benjamin, Alexander, and Owen entered the waiting room together (Step 26), but we cannot trust Benjamin's claim about the location of the watermelon (Step 27). + +Therefore, based on the movements of the grapes and the information provided by the story, we can conclude that the grapes are in the blue_pantry (Option A). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ac153b92197534bc36bd5012c14dcde9423fad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Benjamin really think the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. 
red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to trace Benjamin's movements and his interactions with other agents. According to the story, Benjamin moved the grapes from the blue_pantry to the blue_suitcase and later lost his phone. Alexander then moved the grapes from the blue_suitcase to the red_crate. Finally, Owen moved the grapes from the red_crate to the blue_pantry. + +However, we also know that agents tend to lie, and that Benjamin publicly claimed that the watermelon is in the green_pantry, which suggests that he may not be truthful about the location of the grapes either. + +Therefore, we need to look for any private interactions that Benjamin had with other agents. The only private interaction mentioned in the story is when Owen privately told Benjamin that the watermelon is in the red_pantry. We can assume that if Owen was truthful about the watermelon, he may also be truthful about the grapes. + +Therefore, the answer is O. red_pantry, as that is where Owen told Benjamin the watermelon was located, and where Benjamin may believe the grapes to be located as well. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6c0dce30e6ef669d0ac8af9562016ba40583654 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Liam think Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. 
red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of Benjamin and the grapes, as well as Liam's movements and interactions with Benjamin. + +According to the story, Benjamin initially moved the grapes from the blue_pantry to the blue_suitcase, and later moved the watermelon to the red_pantry. Liam made no movements while in the workshop, but later expressed a preference for the red_bucket. + +There is no direct interaction between Liam and Benjamin regarding the location of the grapes. However, we do know that Owen moved the grapes to the blue_pantry after Benjamin moved them to the blue_suitcase, and Alexander later moved them to the red_crate. + +Based on these movements, it is possible that Liam may think Benjamin still believes the grapes are in the blue_suitcase, since Liam did not witness Owen or Alexander moving the grapes. However, we cannot be certain of this, as Liam may have overheard or been told about the movements of the grapes by another agent. + +Therefore, the answer to the question is E. blue_suitcase, but with some uncertainty. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..16f411d608d909d652659ab16cab3b7ef123a78f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1,68 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? 
+Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? + +2. We need to determine what each agent knows about the location of the grapes. + +3. Benjamin moved the grapes from the blue_pantry to the blue_suitcase, then lost his phone. + +4. Liam made no movements and stayed in the workshop for 1 minute, then exited. + +5. Alexander moved the grapes from the blue_suitcase to the red_crate, then lost his gloves. + +6. Owen moved the grapes from the red_crate to the blue_pantry. + +7. Based on assumption (1), we know that Elizabeth witnessed all of these movements before exiting the workshop. + +8. However, we don't know if Elizabeth had any private or public interactions with Liam or Benjamin about the location of the grapes. + +9. Based on assumption (3), we know that Elizabeth's public claims may not reflect her actual thoughts. + +10. 
Based on assumption (4), we know that Elizabeth may trust Benjamin's claim about the location of the grapes, since he exited the garage after her. + +11. Based on assumption (2), we can only infer what Elizabeth thinks Liam thinks Benjamin thinks about the location of the grapes if they had private or public interactions. + +12. There is no mention of any private interactions between Elizabeth, Liam, and Benjamin. + +13. However, based on assumption (5), we know that Elizabeth may have heard Benjamin's public claim about the location of the watermelon in the green_pantry. + +14. Therefore, Elizabeth may think that Liam thinks Benjamin thinks the grapes are in the green_pantry. + +15. The answer is K. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c87c2e85d171a3922cf342915f3815ff0fa2b649 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. 
+17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Liam think the grapes are? +- Liam made no movements and stayed in the workshop for 1 minute, so he did not see the grapes being moved. +- The grapes were initially in the blue_pantry, but were moved to the blue_suitcase by Benjamin. 
+- Therefore, Liam likely still thinks the grapes are in the blue_pantry. + +2. Where does Elizabeth think Liam thinks the grapes are? +- Elizabeth made no movements and stayed in the workshop for 1 minute, so she did not see the grapes being moved either. +- We know that Liam likely thinks the grapes are in the blue_pantry. +- However, we don't have any information about what Elizabeth thinks about the location of the grapes, so we cannot determine where she thinks Liam thinks they are. + +3. Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes are? +- Alexander moved the grapes from the blue_suitcase to the red_crate after Benjamin had already left the workshop. +- We know that Liam likely thinks the grapes are in the blue_pantry, but we don't know what Elizabeth thinks. +- Benjamin lost his phone in the garage after moving the watermelon to the red_pantry, so he did not hear any public claims about the location of the grapes. +- However, Owen privately told Benjamin that the watermelon is in the red_pantry, so Benjamin knows that Owen is trustworthy. +- Alexander made no movements in the garage and stayed there for 1 minute, so he did not see the watermelon being moved. +- Therefore, Alexander likely trusts Benjamin's claim that the watermelon is in the green_pantry, and he likely thinks that Owen is telling the truth about the location of the watermelon. +- Since Owen privately told Benjamin that the watermelon is in the red_pantry, Alexander likely thinks that Benjamin knows the true location of the watermelon. +- We don't have any information about what Liam thinks about the location of the grapes, so we cannot determine where Alexander thinks Elizabeth thinks Liam thinks Benjamin thinks the grapes are. + +Based on the information given, we cannot determine the answer to the question. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe8616662f71e781a77ac0fd9b5794cbbab947fd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. 
blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the spinach. According to the story, the spinach was initially in the green_envelope (step 3). Mila then moved the spinach to the blue_container (step 4), and Jackson later moved it back to the green_envelope (step 12). Therefore, the spinach is in the green_envelope, which is option L. The other options are not mentioned in the story. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..455b95b99c9b71c87cc06b05ce3856110d5cb1a7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. 
+6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery really think the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track Avery's movements and any interactions he had with other agents. According to the story, Avery entered the kitchen with Mila, Nathan, Isabella, and Jackson. He made no movements and stayed in the kitchen for 1 minute before exiting. Then, he entered the pantry with Jackson and Mila, moved the pear to the green_bucket, and exited the pantry. Finally, he entered the waiting_room with Jackson and Mila. + +There is no mention of Avery having any private or public interactions where he could have shared his thoughts on the location of the spinach. However, we do know that Mila moved the spinach from the green_envelope to the blue_container before exiting the kitchen. Jackson then moved the spinach back to the green_envelope before they all entered the waiting_room. + +Based on Avery's movements and the assumption that he tends to trust agents who exited the room later than himself, we can infer that he may believe the spinach is in the green_envelope since Jackson was the last one to touch it before they all left the kitchen. Therefore, the answer is L. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..17ff09ce1b8b2e0353c2775cc6820677cc8bbc0d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. 
+7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Jackson think Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of Jackson and Avery in relation to the spinach. We know that the spinach was initially in the green_envelope, but Mila moved it to the blue_container before exiting the kitchen. Jackson then moved the spinach back to the green_envelope before leaving the kitchen. + +After leaving the kitchen, Jackson, Avery, Mila, Nathan, and Isabella all entered the waiting_room. Then, Jackson, Avery, and Mila entered the pantry. We don't know if Avery saw the spinach in the blue_container before leaving the kitchen, but we do know that Avery moved the pear to the green_bucket and then left the pantry. Mila then moved the pear to the blue_crate before leaving the pantry. + +The question asks where Jackson thinks Avery thinks the spinach is. Based on the story, we don't have any direct information about what Avery thinks about the spinach's location. However, we can make some inferences based on the movements of Jackson and Avery. + +Since Jackson moved the spinach back to the green_envelope before leaving the kitchen, he likely thinks that the spinach is still in the green_envelope. We also know that Avery moved the pear to the green_bucket in the pantry, so Jackson may trust Avery's judgment about where things are located. + +Therefore, Jackson may think that Avery thinks the spinach is in the green_envelope, since that is where Jackson believes it to be. The answer is L. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e69f2005991ee2699087033d429ff4131e3c9ae3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Isabella think Jackson thinks Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: Step 1: Identify the relevant information in the story. Isabella, Jackson, and Avery were all in the kitchen and pantry at different times. Mila moved the spinach from the green envelope to the blue container. Jackson moved the spinach back to the green envelope. Avery moved the pear from the green bottle to the green bucket, and Mila moved it from the green bucket to the blue crate. Avery privately told Mila that the pear is in the green bottle, and Mila privately told Isabella that the pear is in the blue crate. + +Step 2: Determine the order of exits from the kitchen and pantry. Mila exited the kitchen first, followed by Nathan, Avery, Isabella, and Jackson. In the pantry, Jackson exited last, followed by Avery and Mila. + +Step 3: Determine who Isabella thinks Jackson thinks Avery thinks the spinach is. Isabella was in the kitchen with Jackson and Avery, but she did not move or touch the spinach. Jackson moved the spinach back to the green envelope after Mila had moved it to the blue container. Avery did not touch the spinach. Therefore, Isabella would likely think that Jackson thinks Avery thinks the spinach is in the blue container, since that is where Mila had moved it before Jackson moved it back to the green envelope. + +Step 4: Look for the answer choice that matches the location of the spinach that Isabella thinks Jackson thinks Avery thinks it is. The answer is O. blue_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab45533f031d0a06846333436e037a6cb72fa3fe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1,74 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Nathan think Isabella thinks Jackson thinks Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. 
green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions. + +1. Isabella saw a monkey. (No relevance to the question) +2. Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3. The spinach is in the green_envelope. +4. Mila moved the spinach to the blue_container. +5. Mila exited the kitchen. +6. Nathan made no movements and stayed in the kitchen for 1 minute. +7. Nathan exited the kitchen. +8. Avery made no movements and stayed in the kitchen for 1 minute. +9. Avery exited the kitchen. +10. Isabella made no movements and stayed in the kitchen for 1 minute. +11. Isabella exited the kitchen. +12. Jackson moved the spinach to the green_envelope. +13. Jackson exited the kitchen. +14. Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15. Jackson, Avery and Mila entered the pantry. +16. The pear is in the green_bottle. +17. Jackson made no movements and stayed in the pantry for 1 minute. +18. Isabella likes the blue_container. +19. Jackson exited the pantry. +20. Avery moved the pear to the green_bucket. +21. Avery exited the pantry. +22. Mila moved the pear to the blue_crate. +23. 
Mila exited the pantry. +24. Jackson, Avery and Mila entered the waiting_room. +25. Avery privately told Mila that the pear is in the green_bottle. +26. Mila privately told Isabella that the pear is in the blue_crate. + +Based on the assumption that agents tend to trust those who exit the room later than themselves, we know that Nathan trusts Isabella's thoughts more than Jackson's or Avery's. + +Isabella was in the kitchen when the spinach was in the green envelope, but Mila moved it to the blue container before leaving the kitchen. Isabella did not move the spinach herself, so she knows it is not in the green envelope anymore. + +In the pantry, Jackson stayed for a minute without moving, so he did not move the pear. Isabella likes the blue container, but Mila moved the pear to the blue crate after Avery moved it to the green bucket. Therefore, Isabella knows the pear is not in the blue container. + +Since Nathan trusts Isabella's thoughts more than Jackson's or Avery's, we can eliminate any options that involve Jackson or Avery's actions. The only options left are the ones that involve the spinach being in the blue container or the green envelope. + +Isabella was in the kitchen when the spinach was in the green envelope, but Mila moved it to the blue container before leaving the kitchen. Isabella did not move the spinach herself, so she knows it is not in the green envelope anymore. Therefore, Nathan thinks Isabella thinks the spinach is in the blue container. + +The answer is option E. blue_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a003466106b9cfc954fe31f1a00dc35d4080b0e4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where is the watermelon really? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. 
green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of each agent and their interactions. According to the story, Logan, William, Jacob, Sophia, and Isla entered the front yard. The watermelon was in the red container, and Jacob moved it to the red basket before exiting the front yard. Isla also moved the watermelon to the red container before exiting the front yard. Therefore, the watermelon is in the red container. The answer is A. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..da2e8d1d15b3959d0363cd9ca8c16d26cd14cb50 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. 
+3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Jacob really think the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to follow Jacob's movements and interactions with other agents. Jacob moved the watermelon to the red_basket and then exited the front_yard. He then entered the waiting_room with Logan, William, Sophia, and Isla. Later, he entered the hall with Logan and William, where William moved the eggplant to the red_pantry. Jacob made no movements and stayed in the hall for 1 minute before exiting. Finally, Jacob re-entered the waiting_room with Logan and William, where Logan publicly claimed that the eggplant is in the red_box and Jacob privately told Isla that the eggplant is in the red_pantry. + +Based on the assumptions given, we know that Jacob's private communication with Isla is the most reliable source of information about his actual thought. Therefore, we can conclude that Jacob really thinks the watermelon is in the red_basket, as there is no evidence to suggest otherwise. The correct answer is D. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..22cbdc2e2fc6f040fac4ba2197751795854468f4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. 
+7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Isla think Jacob thinks the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_basket +GPT-4 Explain: The question is asking about Isla's thoughts on where Jacob thinks the watermelon is. To answer this question, we need to look at the actions and interactions of Isla and Jacob in the story. + +Step 1: Identify when Isla and Jacob were in the same place or had interactions. + +- Isla and Jacob were both in the front yard at different times. +- Jacob privately told Isla about the location of the eggplant in the red_pantry. + +Step 2: Determine if Jacob's actions or interactions give any indication of where he thinks the watermelon is. + +- Jacob moved the watermelon to the red_basket before leaving the front yard. +- There is no indication that Jacob made any public claims about the location of the watermelon. + +Step 3: Use the assumptions to determine Isla's thoughts on where Jacob thinks the watermelon is. + +- Isla and Jacob were in the same place (front yard) at different times, so Isla can infer Jacob's actions. +- Isla knows that Jacob moved the watermelon to the red_basket, so she may think that he believes the watermelon is in the red_basket. +- Isla also knows that Jacob privately told her about the location of the eggplant, so she may trust his information about the watermelon. +- Isla may also consider that Jacob could be lying or mistaken about the location of the watermelon. + +Based on this analysis, Isla may think that Jacob thinks the watermelon is in the red_basket. Therefore, the answer is D. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..15db59068e46699335e5079dca6dc8acbc03aff7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Logan think Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Here are the steps to solve the question: + +1. Identify the agents involved in the question: Logan, Isla, and Jacob. +2. Determine the last place where Logan, Isla, and Jacob were together: the waiting_room. +3. Determine the last action related to the watermelon: Isla moved the watermelon to the red_container. +4. Determine the last action related to Jacob and the eggplant: Jacob privately told Isla that the eggplant is in the red_pantry. +5. Apply the assumptions to determine what Logan thinks Isla thinks Jacob thinks about the watermelon: +- Logan was in the waiting_room with Isla and Jacob, so he can infer Jacob's thought from Isla's private conversation. +- Logan publicly claimed that the eggplant is in the red_box, which means he is lying. +- Isla and Jacob did not have any public or private interactions related to the watermelon, so Logan cannot infer their thoughts directly. +- Isla exited the front_yard after Jacob, so Logan tends to trust her more than Jacob. +- Therefore, Logan thinks Isla thinks Jacob thinks the watermelon is in the red_container, which is the last known location of the watermelon. + +The answer is A. red_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..273ba5fcc8bb8c2b50f4d134b82b1589dd3c247f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Sophia think Logan thinks Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. 
blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Sophia made no movements and stayed in the front_yard for 1 minute. +2. Logan exited the front_yard. +3. Isla moved the watermelon to the red_container. +4. Isla exited the front_yard. +5. Logan, William, Jacob, Sophia and Isla entered the waiting_room. +6. Logan, William and Jacob entered the hall. +7. Logan made no movements and stayed in the hall for 1 minute. +8. Logan exited the hall. +9. Sophia dislikes the potato. +10. Jacob privately told Isla that the eggplant is in the red_pantry. + +Based on these steps, we can infer that Sophia did not witness the movement of the watermelon to the red_container, nor did she witness Logan's claim about the eggplant being in the red_box. Therefore, she cannot know where Logan thinks Isla thinks Jacob thinks the watermelon is. + +The correct answer is: None of the above. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ed1e613f1f7f8efd9fd99eab83fdd8e7e2bff6f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where is the pear really? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. 
green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the location of the pear. According to the story, Isabella, Owen, Amelia, Aiden, and Nathan entered the sunroom. Isabella made no movements and stayed in the sunroom for 1 minute before exiting. Owen also made no movements and stayed in the sunroom for 1 minute before exiting. Amelia moved the pear to the green_bucket before exiting the sunroom. Aiden then moved the pear to the blue_suitcase before exiting the sunroom. Finally, Nathan moved the pear to the blue_pantry before exiting the sunroom. + +Therefore, the pear is in the blue_pantry, which is option L. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b4623bb6a05f1f91200b45ca0ddb2490a87fb2b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Nathan really think the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To answer this question, we need to follow Nathan's movements and any interactions he had with other agents. Nathan moved the cherry to the red_container in the study and then Amelia moved it to the red_envelope. There is no information about Nathan's interactions with Isabella, Owen, Aiden, or Amelia regarding the pear. However, Isabella privately told Amelia that the cherry is in the blue_crate, which means that Isabella is lying about the cherry's location. Therefore, we cannot trust Isabella's claim about the pear's location either. + +Based on Nathan's movements and interactions, the only information we have is that he moved the cherry to the red_container in the study. We do not know where he thinks the pear is. Therefore, the answer is not given in the story and cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea6922dd24ec7bf0ea6d1906db8af26a6ad0d58a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. 
+8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Amelia think Nathan thinks the pear is? +Answer: green_bucket +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of Nathan and the pear. 
According to the story, Nathan moved the pear to the blue_pantry (step 13) and later moved the cherry to the red_container (step 19). Amelia moved the pear to the green_bucket (step 8) and later moved the cherry to the red_envelope (step 21). Isabella privately told Amelia that the cherry is in the blue_crate (step 27). + +We don't have any information about Nathan's thoughts on the location of the pear, but we do know that Amelia moved the pear to a different location than where Nathan left it. Therefore, we can assume that Amelia does not think Nathan knows where the pear is. + +Looking at the answer choices, the only location where Nathan was known to have placed the pear is the blue_pantry, which is option L. Therefore, Amelia cannot think that Nathan thinks the pear is in any of the other locations. The answer is L. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..09728ebc0b61f69601a9ca5d8aecda3496862cc8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. 
+16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Isabella think Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Nathan think the pear is? +We know that Nathan moved the pear to the blue_pantry (step 13), so that is where he thinks it is. + +2. Where does Amelia think the pear is? 
+Amelia moved the pear to the green_bucket (step 8), but we don't know if she saw Nathan move it to the blue_pantry. We also don't know if she had any private or public interactions with Nathan or Isabella that would give her more information. Therefore, we cannot determine where Amelia thinks the pear is. + +3. Where does Isabella think Amelia thinks the pear is? +Isabella privately told Amelia that the cherry is in the blue_crate (step 27), but we don't know if she mentioned anything about the pear. However, we do know that Isabella saw a mouse (step 7) and lost his gloves (step 11) while in the sunroom with Amelia and Aiden, who both moved the pear. Isabella also stayed in the study for 1 minute (step 23) and exited after Nathan and Amelia, who both moved the cherry. Based on the assumption that Isabella tends to trust agents who exited the room later than himself, he may trust Nathan's location of the pear in the blue_pantry. However, we cannot determine where Isabella thinks Amelia thinks the pear is. + +Therefore, the answer is indeterminate and cannot be determined based on the given information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ce2dad659cf2f20dcfcf1f72d3072b42b770a6b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. 
+8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Owen think Isabella thinks Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: This question requires a lot of steps to solve. 
Let's break it down: + +1. Owen thinks: We need to determine what Owen's thoughts are. There is no direct information about what Owen thinks, so we need to infer it based on the given information. + +2. Isabella thinks: We need to determine what Isabella thinks about the location of the pear. We know that Isabella lost her gloves, but that doesn't give us any information about what she thinks about the pear's location. + +3. Amelia thinks: We need to determine what Amelia thinks about the location of the pear. We know that Amelia moved the pear to the green_bucket and then exited the sunroom. We don't know if she made any claims about the pear's location. + +4. Nathan thinks: We need to determine what Nathan thinks about the location of the pear. We know that Nathan moved the pear to the blue_pantry and then later moved the cherry to the red_container. We don't know if he made any claims about the pear's location. + +5. Location of the pear: We need to determine the location of the pear based on what Isabella thinks Amelia thinks Nathan thinks. This requires us to trace the thought process backwards. + +Based on the given information, we know that Isabella privately told Amelia that the cherry is in the blue_crate. We don't know if Isabella made any claims about the location of the pear, so we can't use that information to determine what she thinks about the pear's location. + +We know that Amelia publicly claimed that the cherry is in the red_envelope. This claim doesn't give us any information about what she thinks about the pear's location. + +We know that Nathan moved the pear to the blue_pantry. We don't know if he made any claims about the pear's location. + +So, based on the given information, we can't determine where Isabella thinks Amelia thinks Nathan thinks the pear is. + +Therefore, the answer is none of the above (N/A). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6480213d01527b7f0db1852df162a2047f8dd65d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where is the potato really? 
+Answer: blue_crate +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To answer this question, we need to track the movements of the potato and the statements made by the characters. According to the story, the potato was initially in the blue cupboard (step 3), then Chloe moved it to the green bottle (step 4), Nathan moved it to the blue bathtub (step 13), and finally, Noah moved it to the blue crate (step 25). + +Charlotte publicly claimed that the potato is in the blue cupboard (step 29), but we know that the characters tend to lie. Nathan privately told Noah that the potato is in the blue crate (step 31), but we don't know if Noah can be trusted. + +Based on the movements of the potato, the correct answer is D. blue_crate. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..eeb573fad41c4ed5754bb4bb8e37b56126295709 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Charlotte really think the potato is? 
+Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to look for any public or private claims made by Charlotte or any interactions she had with other agents regarding the location of the potato. From the story, we know that Charlotte publicly claimed that the potato is in the blue_cupboard (in step 29). Therefore, the correct answer is A. blue_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..145de715524367ac83275483d385c3ad97a46ee2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. 
+4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Noah think Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of the potato and the preferences of Charlotte and Noah. We know that Nathan privately told Noah that the potato is in the blue_crate, so we can eliminate all options except for blue_crate. We also know that Charlotte publicly claimed that the potato is in the blue_cupboard, but we cannot trust her claim due to the assumption that every agent tends to lie. However, we do know that Charlotte likes the green_bucket and the blue_treasure_chest, but we do not have any information about her preference for the blue_crate. Therefore, we cannot determine where Charlotte thinks the potato is. However, we do know that Noah dislikes the cherry and that he trusts an agent that exited the room later than himself. Since Nathan exited the garden after Noah, Noah may trust Nathan's information about the location of the potato. Therefore, Noah may think that Charlotte thinks the potato is in the blue_crate. The answer is D. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..928fb4502917d2cb976f23cfe03b9c1f91f62194 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1,77 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. 
+4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Ava think Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. To start, we need to identify the agents involved in the question: Ava, Noah, and Charlotte. We also need to consider their movements and interactions in the story. + +Step 1: Identify Ava's movements and interactions +- Ava entered the garden with Chloe, Charlotte, Nathan, and Noah (line 2) +- Ava made no movements and stayed in the garden for 1 minute (line 10) +- Ava exited the garden (line 11) +- Ava likes the red_bucket (line 28) +- Ava did not have any public or private interactions related to the potato + +Step 2: Identify Noah's movements and interactions +- Noah entered the garden with Chloe, Charlotte, Nathan, and Ava (line 2) +- Noah moved the potato to the blue_cupboard (line 15) +- Noah moved the potato to the blue_crate (line 25) +- Noah exited the garden (line 16) +- Nathan privately told Noah that the potato is in the blue_crate (line 31) +- Noah dislikes the cherry (line 24) +- Noah did not have any public or private interactions related to Charlotte's thoughts about the potato + +Step 3: Identify Charlotte's movements and interactions +- Charlotte likes the blue_treasure_chest (line 1) +- Charlotte entered the garden with Chloe, Ava, Nathan, and Noah (line 2) +- Charlotte likes the green_bathtub (line 5) +- Charlotte made no movements and stayed in the garden for 1 minute (line 7) +- Charlotte exited the garden (line 8) +- Charlotte publicly claimed that potato is in the blue_cupboard (line 29) +- Charlotte likes the green_bucket (line 30) +- Charlotte did not have any private interactions related to the potato + +Step 4: Analyze the question +The question asks where Ava thinks Noah 
thinks Charlotte thinks the potato is. We know that Ava did not have any public or private interactions related to the potato, so she cannot know the actual location of the potato. However, we can use the assumptions to infer what Ava might think based on her observations and interactions with the other agents. + +- Ava was in the garden with Noah and Charlotte when they moved the potato (lines 2 and 15) +- Ava saw Charlotte make a public claim about the potato's location (line 29) +- Ava likes the red_bucket (line 28) + +Based on these observations, Ava might think that Noah thinks Charlotte thinks the potato is in the blue_cupboard (the location that Charlotte publicly claimed). This is because Ava saw Charlotte make the claim and Noah was present when she made it. However, we cannot be certain of Ava's thoughts since she did not have any private interactions related to the potato. + +Therefore, the answer is A. blue_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..36a274eb9acae410d73c2984f7c3407ecc55a1ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1,86 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. 
+13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Nathan think Ava thinks Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. 
To break it down, we need to identify the thought process of each agent and their interactions: + +- Charlotte likes the blue_treasure_chest. +- Chloe moved the potato from the blue_cupboard to the green_bottle. +- Charlotte likes the green_bathtub. +- Chloe exited the garden. +- Charlotte made no movements and stayed in the garden for 1 minute. +- Charlotte exited the garden. +- Ava made no movements and stayed in the garden for 1 minute. +- Ava exited the garden. +- Chloe likes the green_bottle. +- Nathan moved the potato from the green_bottle to the blue_bathtub. +- Nathan exited the garden. +- Noah moved the potato from the blue_bathtub to the blue_cupboard. +- Charlotte, Ava, and Nathan entered the garden. +- Charlotte made no movements and stayed in the garden for 1 minute. +- Charlotte exited the garden. +- Ava made no movements and stayed in the garden for 1 minute. +- Ava exited the garden. +- Noah dislikes the cherry. +- Nathan moved the potato from the blue_cupboard to the blue_crate. +- Nathan exited the garden. +- Charlotte, Ava, and Nathan entered the waiting_room. +- Ava likes the red_bucket. +- Charlotte publicly claimed that the potato is in the blue_cupboard. +- Charlotte likes the green_bucket. +- Nathan privately told Noah that the potato is in the blue_crate. + +Based on these events, we can infer the following thoughts: + +- Charlotte likes the blue_treasure_chest, the green_bathtub, and the green_bucket. She publicly claimed that the potato is in the blue_cupboard. +- Chloe likes the green_bottle. +- Ava likes the red_bucket. +- Nathan moved the potato from the green_bottle to the blue_bathtub, then to the blue_crate. He privately told Noah that the potato is in the blue_crate. +- Noah dislikes the cherry. + +To answer the question, we need to trace the chain of thoughts from Nathan to Ava to Noah to Charlotte and determine where Charlotte thinks the potato is. Here are the steps: + +1. Nathan thinks the potato is in the blue_crate. +2. 
Nathan thinks Noah thinks the potato is in the blue_crate (based on his private communication). +3. Ava's thought is unknown, as she made no public or private claims about the potato. +4. Nathan thinks Ava thinks the potato is in the blue_crate (based on his trust assumption). +5. Nathan thinks Ava thinks Noah thinks the potato is in the blue_crate (based on his inference from step 2 and trust assumption). +6. Charlotte publicly claimed that the potato is in the blue_cupboard, so she does not think the potato is in the blue_crate. +7. Therefore, Nathan thinks Ava thinks Noah thinks Charlotte thinks the potato is in the blue_cupboard. + +The answer is A. blue_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3aac5eaf905f000c4240c54580d4481629ec4ee9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. 
+17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where is the cucumber really? +Answer: red_basket +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of the cucumber and who moved it. According to the story, the cucumber was initially in the green_crate (statement 3). Benjamin moved it to the red_container (statement 5), and then Charlotte moved it to the red_basket (statement 7). Therefore, the cucumber is really in the red_basket. The answer is B. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a9cadf8caa09085a62d79f11af6e259c1ce251da --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Benjamin really think the cucumber is? +Answer: red_container +Choices: A. 
green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to follow Benjamin's movements and any interactions he had with other agents regarding the cucumber. According to the story, Benjamin dislikes asparagus and moved the cucumber from the green_crate to the red_container. Charlotte then moved the cucumber to the red_basket. There is no further mention of Benjamin's interactions with the cucumber. Therefore, based on the given information, Benjamin really thinks the cucumber is in the C. red_container. The correct answer is C. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a7f81451681759d30f1c8df21818df28bb804fa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Charlotte think Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements of the cucumber and who interacted with it. Benjamin moved the cucumber to the red_container, and then Charlotte moved it to the red_basket. Isla made no movements with the cucumber. Therefore, Charlotte is the only one who interacted with the cucumber after Benjamin. + +However, we also need to consider the fact that every agent tends to lie. Charlotte publicly claimed that the orange is in the green_bottle, but we cannot trust this claim. + +We also know that Evelyn privately told Benjamin that the orange is in the green_bucket. This means that Benjamin knows the true location of the orange, but it doesn't necessarily mean that he knows the location of the cucumber. + +Therefore, we cannot determine where Charlotte thinks Benjamin thinks the cucumber is based on the given information. The answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..476bacf17f8b04cd55ecfb4ad7e690c24a885fbb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. 
+4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Evelyn think Charlotte thinks Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. To start, we need to identify the relevant agents and their movements: + +- Benjamin dislikes asparagus and likes the green treasure chest. +- Charlotte moved the cucumber to the red basket, stayed in the lounge for 1 minute, and publicly claimed that the orange is in the green bottle. +- Isla likes the blue bucket, made no movements in the lounge, and moved the orange to the green bathtub. +- Ava likes the blue treasure chest and made no movements in the lounge. +- Evelyn made no movements in the lounge, moved the orange to the green bucket, and privately told Benjamin that the orange is in the green bucket. + +Based on these movements, we can eliminate some answer choices: + +- A. green crate: This is where the cucumber was originally, but Benjamin moved it to the red container and Charlotte moved it to the red basket, so it's unlikely that Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is still in the green crate. +- E. blue bucket: Isla likes the blue bucket, but there's no indication that Benjamin or Charlotte have any opinions about it, so it's unlikely that Evelyn is thinking about the blue bucket. +- F. blue cupboard, G. blue bottle, I. blue suitcase: There's no mention of these items in the story, so they can be eliminated. +- J. green pantry: This is not mentioned in the story, so it can be eliminated. +- D. red envelope: There's no mention of a red envelope in the story, so it can be eliminated. + +That leaves us with: + +- B. red basket: Charlotte moved the cucumber here, so it's possible that Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is in the red basket. 
+- C. red container: Benjamin moved the cucumber here, so it's possible that Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is in the red container. +- K. green bucket: This is where Evelyn moved the orange, and she privately told Benjamin that the orange is here. However, there's no direct connection between the orange and the cucumber, so it's unclear why Evelyn would be thinking about the green bucket in relation to the cucumber. +- L. green bottle: Charlotte publicly claimed that the orange is in the green bottle, so it's possible that Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is in the green bottle. +- M. green cupboard: There's no mention of a green cupboard in the story, so it can be eliminated. +- N. green treasure chest: Benjamin likes the green treasure chest, but there's no indication that Charlotte or Evelyn have any opinions about it, so it's unlikely that Evelyn is thinking about the green treasure chest. +- O. green bathtub: Isla moved the orange here, so it's possible that Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is in the green bathtub. + +Based on these options, the most likely answer is either B. red basket or C. red container, as those are the two places where Benjamin or Charlotte have directly interacted with the cucumber. However, without more information about Evelyn's thought process, it's impossible to say for sure which one she thinks Charlotte thinks Benjamin thinks the cucumber is in. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1829b1cb60a3199fe0b9cce9af12c477f14908e3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Isla think Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Isla thinks: We need to consider Isla's movements and interactions with other agents. Isla entered the workshop, stayed there for 1 minute, then exited. She also entered the lounge with Charlotte and Evelyn, but we don't know if they had any private interactions. Isla moved the orange to the green_bathtub, but we're not interested in that. We need to focus on the cucumber. Isla made no movements with the cucumber, so we don't know what she thinks about it. + +2. Evelyn thinks: We know that Evelyn privately told Benjamin that the orange is in the green_bucket. This means that Evelyn knows where the orange is, but we don't know if she knows anything about the cucumber. We need to look for any interactions between Evelyn and the cucumber. + +3. Charlotte thinks: We know that Charlotte publicly claimed that the orange is in the green_bottle. This means that Charlotte thinks the orange is in the green_bottle, but we don't know if she knows anything about the cucumber. We need to look for any interactions between Charlotte and the cucumber. + +4. Benjamin thinks: We know that Benjamin dislikes the asparagus and likes the green_treasure_chest. We don't know if he knows anything about the cucumber. + +Based on this analysis, we can eliminate answer choices that are not related to the cucumber (e.g. blue_treasure_chest, green_bottle). 
We can also eliminate answer choices that are not supported by any interactions between the agents (e.g. red_envelope, blue_cupboard). + +The only answer choice that is supported by an interaction between two agents is red_container. Benjamin moved the cucumber to the red_container, so he knows where it is. Evelyn may or may not know where it is, but she did not have any private interactions with Isla, so Isla cannot infer her thoughts. Charlotte moved the cucumber to the red_basket, so she knows where it is. Isla did not make any movements with the cucumber, so she cannot have any thoughts about it. + +Therefore, the answer is C. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bed0d2a7713037b22059967306c1d39b905baa4f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. 
+18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the cherry and the agents who interacted with it. + +First, Chloe moved the cherry from the red_drawer to the green_pantry. Then, Owen moved the cherry from the green_pantry to the green_bucket. + +Therefore, the cherry is in the green_bucket, which is option K. + +The correct answer is K. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cda62aaaf8f2c46cb8f1c0032eb5ab2c7b2f3616 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Owen really think the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. 
green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to look for any information related to Owen's thoughts about the cherry. According to the story, Owen moved the cherry to the green_bucket and then exited the staircase. There is no further information about Owen's thoughts or actions related to the cherry. Therefore, we can assume that Owen thinks the cherry is in the green_bucket. The answer is K. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f721a9e552342c8e233d9eea3640c3adb8bd702c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. 
+9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Ella think Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the cherry and the agents' interactions. 
We know that Chloe moved the cherry from the red_drawer to the green_pantry, and Owen moved it from the green_pantry to the green_bucket. Ella, Emma, and Abigail made no movements with the cherry. + +We also know that Ella moved the apple from the blue_drawer to the green_bathtub, and Emma moved it from the green_bathtub to the red_crate, and Chloe moved it from the red_crate to the green_crate. Owen lost his watch, and Ella publicly claimed that the apple is in the blue_container, while Chloe privately told Owen that the apple is in the green_crate. + +Based on the assumptions, we can infer that Ella and Owen have not had any private or public interactions regarding the cherry. However, Ella and Owen were both in the staircase before exiting, and Ella exited the staircase after Owen. Therefore, Owen may trust Ella's observation more than the other agents who exited before her. + +Since we are looking for where Ella thinks Owen thinks the cherry is, we need to focus on Ella's movements and claims. Ella did not move the cherry, and she did not publicly claim anything about the cherry. Therefore, we need to look at where the cherry was last seen before Ella exited the staircase. + +According to the story, Owen moved the cherry from the green_pantry to the green_bucket before exiting the staircase. Therefore, Ella may think that Owen thinks the cherry is in the green_bucket. + +The answer is K. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8687330fe7de49cd563924d402dc015854a96840 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Abigail think Ella thinks Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Abigail think Ella thinks Owen thinks the cherry is? + +2. To answer this question, we need to start with Owen's movements. According to the story, Owen moved the cherry to the green_bucket. + +3. Next, we need to consider Ella's movements. Ella moved the apple to the green_bathtub, but there is no mention of her moving the cherry. + +4. Emma made no movements, so we can ignore her for now. + +5. Chloe moved the apple to the green_crate, but there is no mention of her moving the cherry. + +6. Abigail made no movements, so we need to consider her thoughts based on what she witnessed and what she was told. + +7. According to the story, Chloe privately told Owen that the apple is in the green_crate. This means that Abigail may have overheard this conversation and knows that Chloe thinks the apple is in the green_crate. + +8. However, we need to focus on the cherry, not the apple. There is no mention of anyone telling Owen where the cherry is, so we can assume that he doesn't know. + +9. Ella publicly claimed that the apple is in the blue_container, but this doesn't give us any information about the cherry. + +10. Based on the information we have, Abigail has no reason to think that Ella thinks Owen knows where the cherry is. + +11. Therefore, the answer is none of the above. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75ae1f8278709627b7290639b9665efca1290ef9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Emma think Abigail thinks Ella thinks Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. 
blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: This is a complex question that requires breaking down the thought process of each character. + +First, we need to determine where the cherry is currently located. We know that Chloe moved it to the green_pantry and Owen moved it to the green_bucket. Therefore, the cherry is currently in the green_bucket. + +Next, we need to determine who knows where the cherry is. Chloe and Owen both know where it is, but they have already exited the staircase and are not in communication with Abigail, Ella, or Emma. + +We know that Emma made no movements and stayed in the staircase for 1 minute, so she did not see where the cherry was moved. Ella and Abigail also made no movements and stayed in the staircase for 1 minute, so they did not see where the cherry was moved either. + +However, we do know that Chloe privately told Owen that the apple is in the green_crate. This means that Owen knows where the apple is, but he does not know where the cherry is. + +Based on the assumptions given, we know that Abigail can only infer where the cherry is based on the actions and statements of the other characters. She knows that Chloe moved the cherry to the green_pantry, but she does not know that Owen moved it to the green_bucket. Therefore, she may think that the cherry is still in the green_pantry. 
+ +Ella made a public claim that the apple is in the blue_container, but this does not give any information about where the cherry is. + +Emma made no movements and stayed in the staircase for 1 minute, so she did not see where the cherry was moved. However, she knows that Chloe privately told Owen that the apple is in the green_crate. This means that she may think that Owen knows where the cherry is, but she does not know where Abigail or Ella think the cherry is. + +Therefore, the answer to the question is that we cannot determine where Emma thinks Abigail thinks Ella thinks Owen thinks the cherry is, as there is not enough information given to make that inference. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3ee9a9ea0a8a6924f0fbf224211fb35d1e56307 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. 
+16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To solve this question, we need to track the movements of the sweet_potato and the agents. According to the story, the sweet_potato was initially in the red_drawer, then moved to the red_crate by Mila, and finally moved to the red_container by Mila again. + +We also know that Liam, Hannah, Emma, Mila, and Evelyn entered the cellar together, but only Liam, Hannah, and Emma exited before Mila moved the sweet_potato to the red_crate. 
This means that only Mila and Evelyn were in the cellar when the sweet_potato was moved to the red_crate. + +Later, Liam, Mila, and Evelyn entered the cellar together, and Liam stayed in the cellar for a minute before Mila moved the sweet_potato to the red_container. This means that only Mila and Evelyn knew the true location of the sweet_potato when they exited the cellar together. + +In the waiting_room, Mila publicly claimed that the sweet_potato was in the blue_container, but Evelyn privately told Mila that the sweet_potato was in the blue_suitcase. However, we know that Mila was the last to exit the cellar with the sweet_potato in the red_container, and agents tend to trust those who exit later than themselves. Therefore, it is likely that Mila is telling the truth about the sweet_potato being in the blue_container, and Evelyn is lying about its true location in the blue_suitcase. + +Therefore, the answer to the question is K. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1f195b35c78a544b851c1e2175205a2373c813a5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. 
+11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Liam really think the sweet_potato is? +Answer: blue_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track Liam's movements and any interactions he had with other agents regarding the sweet_potato. Liam entered the cellar with Hannah, Emma, Mila, and Evelyn. 
He made no movements and stayed in the cellar for 1 minute before exiting. Later, Liam, Mila, and Evelyn entered the cellar again, and Liam made no movements and stayed in the cellar for 1 minute before exiting. There is no mention of Liam having any private or public interactions regarding the sweet_potato. + +Based on these movements and interactions, we can eliminate all options except for D. red_basket and M. red_container. The sweet_potato was moved from the red_drawer to the red_crate by Mila, and later from the red_crate to the red_container by Mila. Liam was present in the cellar both times the sweet_potato was in the red container. Since Liam made no movements and had no interactions regarding the sweet_potato, we cannot determine his actual thought. However, we know that Liam tends to lie, so we cannot trust any public claims he may make. Therefore, the answer is either D. red_basket or M. red_container, but we cannot determine which one Liam actually thinks the sweet_potato is in. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..557c90dfff4241974561647b7ac6396d4fa0cce0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. 
+10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Hannah think Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: To answer this question, we need to track the movements and actions of Hannah and Liam regarding the sweet_potato. 
Liam did not move or interact with the sweet_potato during his time in the cellar, and Hannah also did not move or interact with it during her time in the cellar. Therefore, we can assume that Hannah has no direct knowledge of where Liam thinks the sweet_potato is. + +However, we do know that Mila moved the sweet_potato from the red_drawer to the red_crate while Hannah was not in the cellar. When Liam, Mila, and Evelyn re-entered the cellar, the sweet_potato was in the red_crate. Liam again did not move or interact with the sweet_potato during his time in the cellar. + +Therefore, we can infer that Liam thinks the sweet_potato is in the red_crate, since that is where it was when he was last in the cellar. However, we do not know if Hannah is aware of this information or if she has any other thoughts or beliefs about the sweet_potato's location. + +Based on the given options, we cannot definitively determine where Hannah thinks Liam thinks the sweet_potato is. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..44f964b269c2dc8cdb4e0677eabfb95df33d4aa6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. 
+11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? + +2. 
We need to determine where Liam thinks the sweet_potato is first. According to the story, Liam made no movements in the cellar and stayed there for 1 minute. When he exited the cellar, the sweet_potato was still in the red_drawer. Later, when Liam, Mila, and Evelyn entered the cellar again, Liam made no movements and stayed there for 1 minute. When he exited the cellar, Mila had moved the sweet_potato to the red_container. Therefore, Liam thinks the sweet_potato is in the red_container. + +3. We need to determine where Hannah thinks Liam thinks the sweet_potato is. According to the story, Hannah made no movements in the cellar and stayed there for 1 minute. When she exited the cellar, the sweet_potato was still in the red_drawer. There is no information about whether Hannah had any private or public interactions with Liam, so we cannot infer where she thinks Liam thinks the sweet_potato is. However, we do know that Liam exited the cellar before Hannah, so if Hannah trusts Liam more than herself, she would think the sweet_potato is in the red_container. + +4. We need to determine where Evelyn thinks Hannah thinks Liam thinks the sweet_potato is. According to the story, Evelyn made no movements in the cellar and stayed there for 1 minute. When she exited the cellar, the sweet_potato was still in the red_container. Later, Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. There is no information about whether Evelyn had any private or public interactions with Hannah, so we cannot infer where she thinks Hannah thinks Liam thinks the sweet_potato is. However, we do know that Evelyn exited the cellar after Liam, Mila, and Evelyn, so if Evelyn trusts Liam more than herself, she would think Hannah thinks Liam thinks the sweet_potato is in the red_container. + +5. Therefore, the answer is D. red_basket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ed54ab3bd51edc1182f12cec58cd2fcf9f2d0df --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. 
green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Liam think the sweet_potato is? +- We know that Liam made no movements in the cellar and stayed there for 1 minute. When he exited the cellar, the sweet_potato was still in the red_drawer. Therefore, Liam thinks the sweet_potato is in the red_drawer (answer: L). + +2. Where does Hannah think the sweet_potato is? +- We know that Hannah made no movements in the cellar and stayed there for 1 minute. When she exited the cellar, the sweet_potato was still in the red_drawer. Therefore, Hannah also thinks the sweet_potato is in the red_drawer (answer: L). + +3. Where does Emma think the sweet_potato is? +- We know that Emma made no movements in the cellar and stayed there for 1 minute. When she exited the cellar, the sweet_potato was still in the red_drawer. Therefore, Emma also thinks the sweet_potato is in the red_drawer (answer: L). + +4. Where does Mila think the sweet_potato is? +- We know that Mila moved the sweet_potato from the red_drawer to the red_crate. When she exited the cellar, the sweet_potato was in the red_crate. 
Later, Mila moved the sweet_potato from the red_crate to the red_container. Therefore, Mila thinks the sweet_potato is in the red_container (answer: M). + +5. Where does Evelyn think the sweet_potato is? +- We know that Evelyn made no movements in the cellar and stayed there for 1 minute. When she exited the cellar, the sweet_potato was still in the red_crate. Later, Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. Therefore, Evelyn thinks the sweet_potato is in the blue_suitcase (answer: N). + +6. Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +- This is the tricky part of the question. We need to work backwards from Evelyn's thought to Liam's thought, passing through Hannah's and Liam's thoughts. We know that Emma thinks the sweet_potato is in the red_drawer (answer: L). We also know that Evelyn thinks the sweet_potato is in the blue_suitcase (answer: N). Therefore, we need to find out where Mila thinks the sweet_potato is, because Mila is the last person to have moved the sweet_potato before Evelyn's private communication with her. We already know that Mila thinks the sweet_potato is in the red_container (answer: M). Therefore, Evelyn must have told Mila a lie, because the sweet_potato is not in the blue_suitcase. We also know that Mila publicly claimed that the sweet_potato is in the blue_container (answer: K). Therefore, Evelyn must have heard Mila's claim and decided to lie to her privately. We don't know what Hannah thinks about the sweet_potato's location, because she didn't move it and didn't have any private or public interactions with Evelyn. Therefore, we can't determine where Hannah thinks the sweet_potato is. Finally, we know that Liam thinks the sweet_potato is in the red_drawer (answer: L). Therefore, Emma thinks that Evelyn thinks Hannah thinks Liam thinks the sweet_potato is in the red_drawer (answer: L). 
+ +Answer: L (red_drawer) \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f810b297e7393df027c3249ad7e055c08ee2c6be --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where is the carrot really? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. 
blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the location of the carrot. According to the story, the carrot was initially in the green_treasure_chest, but Noah moved it to the blue_suitcase. Emily later moved the carrot to the blue_drawer. Therefore, the carrot is in the blue_drawer. The answer is I. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b12e8ab0c950fe7cfd23cbdf9bc8b3fb7469ea4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. 
+7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Benjamin really think the carrot is? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_drawer +GPT-4 Explain: To answer this question, we need to track Benjamin's movements and any interactions he had with other agents regarding the location of the carrot. According to the story, Benjamin entered the pantry twice, and on his second visit, he moved the beans to the blue_drawer. He then exited the pantry and later publicly claimed that the beans were in the blue_bottle. There is no mention of Benjamin interacting with anyone about the location of the carrot, so we cannot infer his thoughts based on any private conversations. Therefore, we need to look for any clues about the carrot's location based on Benjamin's movements and actions. + +On his first visit to the pantry, Benjamin made no movements and stayed in the pantry for one minute before exiting. On his second visit, he moved the beans to the blue_drawer and then exited the pantry. We know that Noah moved the carrot from the green_treasure_chest to the blue_suitcase before exiting the pantry. Emily then moved the carrot from the blue_suitcase to the blue_drawer before exiting the pantry. There is no mention of Benjamin interacting with the carrot or moving it to a different location. + +Based on this information, we can conclude that Benjamin's actual thought about the location of the carrot is unknown. The story does not provide any evidence to suggest where Benjamin thinks the carrot is, so we cannot choose any of the options provided. The correct answer is therefore "unknown." \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ed9ab26c33c1ee1bf643b15efbc2758d3dbd994d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Noah think Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of Noah and Benjamin and their interactions with the carrot. + +Noah moved the carrot from the green_treasure_chest to the blue_suitcase, and later made no movements in the pantry. Benjamin made no movements in the pantry, but later moved the beans from the blue_bottle to the blue_drawer and publicly claimed that the beans are in the blue_bottle. + +Since Noah and Benjamin were both in the pantry at different times and Benjamin made no movements related to the carrot, Noah would not have any reason to believe that Benjamin knows where the carrot is. Therefore, the answer is not A, B, C, D, E, G, K, L, M, N, or O. + +The only option left is I, the blue_drawer, which is where Emily moved the carrot to after Noah moved it to the blue_suitcase. Since Emily privately told Sophia that the beans are in the blue_drawer, it's possible that Noah overheard this conversation and may think that Benjamin knows where the carrot is. Therefore, the answer is I, blue_drawer. + +The answer is I, blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3dae28b0a3bc5cb82f0dda701056ae2bd8fd7eb4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Emily think Noah thinks Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Here are the steps to solve the question: + +1. Identify the relevant agents: The question asks about Emily's thoughts about where Noah thinks Benjamin thinks the carrot is. So we need to focus on Emily, Noah, and Benjamin. + +2. Trace their movements: According to the story, Emily, Noah, and Benjamin entered the pantry together (step 15), and then Benjamin exited the pantry after moving the beans to the blue_drawer (step 18). Noah stayed in the pantry for 1 minute before exiting (step 19), and Emily made no movements and stayed in the pantry for 1 minute before exiting (step 22). Then they all entered the waiting_room together (step 24). + +3. Consider their interactions: The story tells us that Benjamin publicly claimed that the beans are in the blue_bottle (step 25), but we don't know if anyone believed him. Emily privately told Sophia that the beans are in the blue_drawer (step 26), but we don't know if Noah or Benjamin heard her. + +4. Infer their thoughts: Based on the assumptions, we know that Emily can only infer Noah's thoughts if they have been in the same place or had private or public interactions. Emily was in the pantry with Noah and Benjamin, but we don't know if they had any interactions that would reveal their thoughts about the carrot. We also know that agents tend to lie, so we can't trust what they say to each other or publicly. + +5. Use logic to eliminate options: We can eliminate some options based on the story. For example, we know that the carrot was initially in the green_treasure_chest (step 2) and then moved to the blue_suitcase by Noah (step 3). 
We also know that Emily moved the carrot to the blue_drawer (step 9). So we can eliminate options that don't involve the blue_suitcase or blue_drawer. We also know that Noah dislikes the corn (step 10) and likes the red_basket (step 20), but we don't have any information about his thoughts on the carrot. + +6. Consider the exit order: According to assumption 4, agents tend to trust agents who exited the room later than themselves. In this case, we know that Noah exited the pantry before Emily (step 21), so Emily might not trust Noah's thoughts about the carrot. + +7. Make an educated guess: Based on the information we have, we can make an educated guess about where Emily thinks Noah thinks Benjamin thinks the carrot is. Since we know that the carrot was initially in the green_treasure_chest and then moved to the blue_suitcase by Noah, it's possible that Emily thinks Noah still believes the carrot is in the blue_suitcase. Benjamin moved the beans to the blue_drawer, so Emily might think he knows that the carrot is also in the blue_drawer. Therefore, Emily might think that Noah thinks Benjamin thinks the carrot is in the blue_drawer (option I). + +Answer: I. blue_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dfce7eaaebc21a2f769dbe836a46e74f202f2e3d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1,67 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. 
+6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Sophia think Emily thinks Noah thinks Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Sophia thinks that Emily thinks that Noah thinks that Benjamin thinks the carrot is in a certain location. +2. We need to determine which location Sophia thinks this is. + +To solve this question, we need to trace the movements of the carrot and the agents in the story. Here are the key steps: + +1. The carrot is initially in the green_treasure_chest. +2. Noah moves the carrot to the blue_suitcase. +3. Emily moves the carrot to the blue_drawer. +4. Noah dislikes the corn. +5. Benjamin publicly claims that the beans is in the blue_bottle. +6. Emily privately tells Sophia that the beans is in the blue_drawer. + +Based on these steps, we can eliminate some of the answer choices. For example, we know that the carrot is not in the green_drawer or the red_container, because these locations are not mentioned in the story. We also know that the carrot is not in the blue_bottle, because Benjamin publicly claimed that the beans are in that location, not the carrot. + +To determine the correct answer, we need to consider the movements of the agents and their trust levels. Here are the key steps: + +1. Noah moves the carrot to the blue_suitcase and then exits the pantry. +2. Jack and Benjamin make no movements and then exit the pantry. +3. Emily moves the carrot to the blue_drawer and then exits the pantry. +4. Sophia makes no movements and then exits the pantry. +5. Benjamin, Noah, and Emily enter the pantry again. +6. Benjamin moves the beans to the blue_drawer and then exits the pantry. +7. Noah makes no movements and then exits the pantry. +8. Emily makes no movements and then exits the pantry. +9. Benjamin, Noah, and Emily enter the waiting_room. 
+ +Based on these steps, we can infer that Sophia trusts Emily more than Noah or Benjamin, because Emily was the last to exit the pantry before they all entered the waiting_room together. Therefore, Sophia is most likely to believe that Emily's thoughts about the carrot's location are accurate. + +We also know that Emily moved the carrot to the blue_drawer, so Sophia thinks that Emily thinks that the carrot is in the blue_drawer. However, we need to consider Noah's dislike of corn. If Sophia is aware of this fact, she may believe that Noah would not have moved the carrot to a location near the corn. The only location that is not near the corn and is also mentioned in the answer choices is the blue_suitcase. Therefore, Sophia may think that Emily thinks that Noah thinks that Benjamin thinks the carrot is in the blue_suitcase. + +The correct answer is therefore J. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e996f13b30d18331306cf80256d51e20079c9093 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1,70 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. 
+14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where is the onion really? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their interactions. + +1. Mila, Isabella, Owen, Emily, and Sophia entered the porch. +2. The onion is in the red_crate. +3. Mila made no movements and stayed in the porch for 1 minute. +4. Mila exited the porch. +5. Isabella made no movements and stayed in the porch for 1 minute. +6. Isabella exited the porch. +7. 
Owen moved the onion to the red_drawer. +8. Owen exited the porch. +9. Emily moved the onion to the red_bottle. +10. Emily exited the porch. +11. Sophia moved the onion to the red_crate. +12. Isabella lost his phone. +13. Sophia exited the porch. +14. Mila, Isabella, Owen, Emily, and Sophia entered the waiting_room. +15. Isabella, Mila, and Owen entered the porch. +16. The onion is in the red_crate. +17. Isabella moved the onion to the blue_crate. +18. Isabella exited the porch. +19. Sophia dislikes the onion. +20. Mila made no movements and stayed in the porch for 1 minute. +21. Mila exited the porch. +22. Owen made no movements and stayed in the porch for 1 minute. +23. Owen exited the porch. +24. Isabella, Mila, and Owen entered the waiting_room. +25. Isabella publicly claimed that onion is in the green_cupboard. +26. Owen privately told Emily that the onion is in the blue_crate. + +Based on the movements and interactions, we can eliminate some options. The onion was initially in the red_crate, then moved to the red_drawer by Owen, then to the red_bottle by Emily, and finally back to the red_crate by Sophia. Isabella moved the onion to the blue_crate, but we don't know if it was the same onion or a different one. + +Isabella publicly claimed that the onion is in the green_cupboard, but we know that the onion was last seen in the red_crate. Owen privately told Emily that the onion is in the blue_crate, which could be true if Isabella moved a different onion to the blue_crate. + +Therefore, the most likely answer is that the onion is in the red_crate (option L). 
+ +a: 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..aee9e3b668bd2fbe543a14ff842153f7fab685f7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Owen really think the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. 
red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: To solve this question, we need to follow Owen's movements and interactions with other agents. According to the story, Owen moved the onion to the red_drawer and then exited the porch. Later, Owen privately told Emily that the onion is in the blue_crate. Therefore, Owen really thinks that the onion is in the blue_crate. The answer is O. blue_crate. + +a: 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe0bf32aba270882da70a8a8e872c091ddf8c678 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. 
+9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Emily think Owen thinks the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: The question is asking about Emily's thoughts regarding where Owen thinks the onion is. To answer this question, we need to consider the actions and interactions of Emily and Owen in the story. 
+ +Step 1: Emily moved the onion to the red_bottle, and then she exited the porch. + +Step 2: Owen moved the onion to the blue_crate, and then he exited the porch. + +Step 3: Owen privately told Emily that the onion is in the blue_crate. + +Based on these steps, we can conclude that Emily knows that the onion is in the blue_crate because Owen told her so privately. Therefore, Emily thinks that Owen thinks the onion is in the blue_crate. + +The answer is D. blue_bottle. + +a: 4 5 6 7 9 1 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b84b4e1416fb8c9032b84730b0f33632bcd4e990 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1,72 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. 
+23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Isabella think Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: The question is asking for Isabella's belief about Emily's belief about Owen's belief about the location of the onion. To solve this question, we need to trace the path of the onion and the agents' movements and interactions. + +1. Mila, Isabella, Owen, Emily, and Sophia entered the porch. +2. The onion is in the red_crate. +3. Mila made no movements and stayed in the porch for 1 minute. +4. Mila exited the porch. +5. Isabella made no movements and stayed in the porch for 1 minute. +6. Isabella exited the porch. +7. Owen moved the onion to the red_drawer. +8. Owen exited the porch. +9. Emily moved the onion to the red_bottle. +10. Emily exited the porch. +11. Sophia moved the onion to the red_crate. +12. Isabella lost his phone. +13. Sophia exited the porch. +14. 
Mila, Isabella, Owen, Emily, and Sophia entered the waiting_room. +15. Isabella, Mila, and Owen entered the porch. +16. The onion is in the red_crate. +17. Isabella moved the onion to the blue_crate. +18. Isabella exited the porch. +19. Sophia dislikes the onion. +20. Mila made no movements and stayed in the porch for 1 minute. +21. Mila exited the porch. +22. Owen made no movements and stayed in the porch for 1 minute. +23. Owen exited the porch. +24. Isabella, Mila, and Owen entered the waiting_room. +25. Isabella publicly claimed that onion is in the green_cupboard. +26. Owen privately told Emily that the onion is in the blue_crate. + +Based on the story and assumptions, we know that Isabella lied about the onion's location when he claimed it was in the green_cupboard. We also know that Owen privately told Emily that the onion is in the blue_crate. Therefore, Emily knows that the onion is in the blue_crate. + +Isabella exited the porch before Owen, so he trusts Owen's information more than his own belief. Therefore, Isabella thinks that Owen thinks the onion is in the blue_crate. + +We don't have any information about where Emily thinks the onion is, but we know that she knows it's in the blue_crate. Therefore, Isabella thinks that Emily thinks Owen thinks the onion is in the blue_crate. + +The answer is D. blue_bottle. + +a: 4 5 6 7 9 1 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ac7006a0f41533bb8914dd3b60e0be1d9467508 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1,67 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. 
+2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? + +2. We know that Isabella publicly claimed that the onion is in the green_cupboard, but we cannot assume that this is true. + +3. Owen privately told Emily that the onion is in the blue_crate, but we cannot assume that Emily believes him. + +4. Sophia dislikes the onion, so we can assume that she has no idea where it is. + +5. Mila and Owen made no movements in the porch, so they have no new information about the onion's location. + +6. Isabella moved the onion from the red_crate to the blue_crate, so she knows that it is not in the red_crate. + +7. Based on assumption (2), we can assume that Isabella knows that Emily knows that the onion is not in the red_crate. + +8. Owen moved the onion from the red_crate to the red_drawer, so he knows that it is not in the red_crate. + +9. Based on assumption (4), we can assume that Emily trusts Owen's information and believes that the onion is in the blue_crate. + +10. Based on assumption (2), we can assume that Isabella knows that Owen knows that the onion is in the blue_crate. + +11. Based on assumption (2), we can assume that Isabella knows that Emily knows that Owen knows that the onion is in the blue_crate. + +12. Based on assumption (2), we can assume that Sophia knows that Isabella moved the onion from the red_crate to the blue_crate. + +13. Based on assumption (2), we can assume that Sophia knows that Isabella knows that Emily knows that Owen knows that the onion is in the blue_crate. + +14. Therefore, Sophia thinks that Isabella thinks Emily thinks Owen thinks the onion is in the blue_crate (option O). + +The answer is O. blue_crate. 
+ +a: 4 5 6 7 9 1 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..80e3ad085becea91e47844d0e089c156f1e06d83 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. 
blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To solve this question, we need to track the movements of each agent with the melon. According to the story, Lily did not move the melon, Amelia moved it to the green bucket, Jacob moved it to the green drawer, Evelyn moved it to the green bottle, and Ava moved it back to the blue treasure chest. Therefore, the melon is really in the blue treasure chest, which is option B. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6a0349271a4399a2d3099bfd57078b8328b5c2ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. 
+9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Jacob really think the melon is? +Answer: green_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track Jacob's movements with the melon and his interactions with other agents. Jacob moved the melon to the green_drawer before exiting the garden. 
However, we don't know if he actually thinks the melon is in the green_drawer or if he moved it there to deceive others. In the dining_room, Lily moved the cherry to the red_box before exiting, and then Jacob moved the cherry to the blue_bottle before exiting. Amelia moved the cherry to the red_envelope before exiting. In the waiting_room, Jacob publicly claimed that the cherry is in the red_box, but Amelia privately told Jacob that the cherry is in the red_envelope. + +Based on the assumptions given, we know that Jacob may be lying about where he thinks the melon is. However, we can infer that he trusts Amelia more than Lily because she exited the dining_room after him. Therefore, we can eliminate options A, D, E, F, H, I, J, K, L, N, and O because they were moved by Lily, and Jacob may not trust her. We can also eliminate option C because it was not mentioned in the story. + +That leaves us with option B, the blue_treasure_chest, which is where the melon was originally located before Amelia moved it to the green_bucket. Since Jacob was the first to move the melon, it's possible that he thinks it's still in the blue_treasure_chest. Therefore, the answer is B. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7caa127b6843eb1e6649eb3d51ea45a530f2e818 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. 
+6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Lily think Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: The question is asking about Lily's thoughts on Jacob's thoughts about the location of the melon. 
To answer this question, we need to trace Jacob's movements with the melon and determine where Lily was present with Jacob or had interactions with him. + +Jacob moved the melon to the green_drawer, which means Lily was not present with him at that time. However, Lily did have interactions with Amelia, who moved the melon to the green_bucket. Therefore, Lily knows that the melon was moved from the blue_treasure_chest to the green_bucket. + +Since Lily did not witness Jacob moving the melon to the green_drawer, she cannot be sure if he knows that the melon is now in the green_bucket. However, Lily did witness Ava moving the melon to the blue_treasure_chest, which was the original location of the melon. Therefore, Lily may think that Jacob still believes the melon is in the blue_treasure_chest. + +The answer is B. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..85e313f2c6ebc4bef513fcd44541aef13b2b5be7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. 
+15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Evelyn think Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. We need to determine where Evelyn thinks Lily thinks Jacob thinks the melon is. This means we need to trace the movements of the melon and the agents' thoughts about its location. + +2. 
According to the story, the melon starts in the blue_treasure_chest and is moved by each agent in turn: Amelia to the green_bucket, Jacob to the green_drawer, Evelyn to the green_bottle, and finally Ava back to the blue_treasure_chest. + +3. Lily does not move the melon, but she does spend some time in the garden before leaving. + +4. We don't have any direct information about what any of the agents think about the melon's location, but we do know that they tend to lie and that they can infer each other's thoughts based on their interactions. + +5. We also know that Lily moves the cherry from the green_treasure_chest to the red_box in the dining_room, and that Jacob later moves it to the blue_bottle before Amelia moves it to the red_envelope. + +6. Finally, we know that Jacob publicly claims that the cherry is in the red_box, but Amelia privately tells him that it is actually in the red_envelope. + +Based on this information, we can make some educated guesses about where Evelyn thinks Lily thinks Jacob thinks the melon is. Here's our reasoning: + +- Lily never moves the melon, so she doesn't have any direct knowledge of its location. +- Jacob is the last agent to move the melon before it ends up back in the blue_treasure_chest, so he is the most recent person to have interacted with it. +- However, we know that Jacob lies and that Amelia tells him the truth about the cherry's location, so it's possible that he is lying about the melon as well. +- Evelyn moves the melon to the green_bottle, but we don't know if she has any reason to believe that this is the correct location. +- Based on the available information, it's difficult to say where Lily thinks Jacob thinks the melon is, let alone where Evelyn thinks Lily thinks Jacob thinks it is. + +Given these limitations, we can only eliminate some of the answer choices based on what we know about the story. 
For example, we know that the melon is not in the green_crate, the green_envelope, the red_basket, or the blue_suitcase, because these items are not mentioned in the story at all. We also know that the melon is not in the green_treasure_chest, because that is where the cherry is located. + +That leaves us with several possible answer choices: green_bottle, blue_treasure_chest, blue_bucket, green_bucket, green_drawer, green_bathtub, red_box, red_envelope, blue_container, and blue_bottle. + +Without more information about the agents' thoughts and interactions, it's impossible to say for sure where Evelyn thinks Lily thinks Jacob thinks the melon is. However, based on the available information, the most likely answer is either blue_treasure_chest (since that is where the melon starts and ends up) or green_bottle (since that is where Evelyn moves it). Therefore, the answer is either A. green_bottle or B. blue_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7eba57fe11cde61dcdf3f8da1fcbbfe80820b45a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. 
+13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Ava think Evelyn thinks Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This question requires a lot of logical reasoning and deduction. We need to trace the movements of the melon and the agents' thoughts about it. + +First, Lily did not move the melon and left the garden before anyone else moved it. Therefore, she has no idea where the melon is. 
+ +Amelia moved the melon to the green_bucket, but we don't know if she told anyone about it. + +Jacob moved the melon to the green_drawer, but again, we don't know if he shared this information with anyone. + +Evelyn moved the melon to the green_bottle, but we don't know if she told anyone about it. + +Finally, Ava moved the melon back to the blue_treasure_chest. We don't know if she knew where the melon was before she moved it, but we do know that she put it back in the blue_treasure_chest. + +Now we need to consider the agents' thoughts about the melon's location. We know that Lily has no idea where the melon is. We don't know if Amelia, Jacob, or Evelyn shared their knowledge about the melon's location with anyone else. + +However, we do know that Jacob publicly claimed that the cherry is in the red_box, even though he moved it to the blue_bottle. This means that we can't trust Jacob's public claims about the location of objects. + +We also know that Amelia privately told Jacob that the cherry is in the red_envelope. This means that Amelia knows where the cherry is, but we don't know if she knows where the melon is. + +Based on all of this information, we can't definitively say where Ava thinks Evelyn thinks Lily thinks Jacob thinks the melon is. However, we do know that the melon was last seen in the blue_treasure_chest, which is option B. Therefore, the answer is B. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d6c5147ad1b17c40acb20328133c72116861a1b0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where is the peas really? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To solve this question, we need to follow the movements of each agent and their interactions. According to the story, the peas was initially in the red_bottle (step 2), then Isabella moved it to the green_bottle (step 7), then Hannah moved it to the blue_treasure_chest (step 9), and finally Chloe moved it back to the red_bottle (step 12). However, in step 17, when Isabella, Logan, and Emma entered the hallway again, the peas was back in the red_bottle. Logan publicly claimed that the peas is in the green_bottle (step 25), but Emma privately told Logan that the peas is in the red_bottle (step 26). Since Emma was in the hallway after Logan and had a private interaction with him, we can assume that Logan trusts her more than Isabella, who moved the peas to the blue_treasure_chest. Therefore, the peas is actually in the red_bottle, which is option A. + +a: 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e342054c29595cdc20b8ab43a4553401433041c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1,43 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. 
+9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Emma really think the peas is? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to follow Emma's movements and interactions with other agents. Emma first enters the hallway with Logan, Isabella, Hannah, and Chloe. 
She then stays in the hallway for one minute before exiting. Later, she enters the hallway again with Isabella and Logan. Isabella moves the peas to the blue_treasure_chest before exiting, and Logan moves the peas to the blue_bathtub before exiting. Emma then moves the peas to the red_pantry before exiting. + +We know from the story that Logan publicly claimed that the peas is in the green_bottle, but Emma privately told Logan that the peas is in the red_bottle. However, we cannot assume that Emma actually thinks the peas is in the red_bottle just because she told Logan that. We need to consider her movements and interactions with other agents. + +Based on the story, Emma never moved the peas to the red_bottle. The peas was in the red_bottle when Logan first entered the hallway, and it was still in the red_bottle when Isabella, Logan, and Emma entered the waiting_room together. Emma only moved the peas once, to the red_pantry, after Isabella had already moved it to the blue_treasure_chest and Logan had moved it to the blue_bathtub. + +Therefore, the answer is B. red_pantry. Emma moved the peas to the red_pantry before exiting the hallway. + +a: 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..61d32e1d645675fd1a65d27de7fb87f620f238a4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. 
+6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Hannah think Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to track the movements of Hannah and Emma and their interactions with each other. + +According to the story, Hannah moved the peas to the blue_treasure_chest and then exited the hallway. Emma moved the peas to the red_pantry and then exited the hallway. + +Later, Logan publicly claimed that the peas is in the green_bottle, but Emma privately told Logan that the peas is in the red_bottle. + +Since Hannah and Emma did not have any interactions with each other, we cannot directly infer where Hannah thinks Emma thinks the peas is. However, we can use the assumption that an agent tends to trust an agent that exited the room later than himself. + +Since Hannah exited the hallway before Emma, she would not trust Emma's claim about the location of the peas. Therefore, Hannah would likely think that Emma thinks the peas is in a different location than what she privately told Logan. + +Based on the story, the only other location that the peas was in at some point is the blue_treasure_chest, which is where Hannah moved the peas to. Therefore, Hannah would likely think that Emma thinks the peas is in the blue_treasure_chest. + +The answer is E. blue_treasure_chest. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..20da3defa4c59e57294194173eee52cf7af15669 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. 
+4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Chloe think Hannah thinks Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Chloe think Hannah thinks Emma thinks the peas is? + +2. Chloe exited the hallway before Hannah, so she trusts Hannah more than Emma. + +3. Hannah moved the peas to the blue_treasure_chest, so Chloe knows that Hannah thinks the peas is in the blue_treasure_chest. + +4. Emma privately told Logan that the peas is in the red_bottle, so Chloe knows that Emma thinks the peas is in the red_bottle. + +5. Chloe did not witness Isabella's movements, so she cannot infer where Isabella thinks the peas is. + +6. Isabella moved the peas to the green_bottle, but Chloe does not know this information. + +7. Therefore, Chloe thinks that Hannah thinks Emma thinks the peas is in the blue_treasure_chest. + +The answer is E. blue_treasure_chest. + +a: 5 6 7 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a721ab8fabd72cb209e7279fe541f19926aacd8b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. 
+13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Logan think Chloe thinks Hannah thinks Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: This question requires a lot of steps to solve. Let's break it down: + +1. Logan publicly claimed that the peas is in the green_bottle. +2. Emma privately told Logan that the peas is in the red_bottle. +3. We need to determine where Logan thinks Chloe thinks Hannah thinks Emma thinks the peas is. 
+ +To solve this question, we need to work backwards. We know that Emma told Logan that the peas is in the red_bottle, so Logan knows that the peas is not in the green_bottle. Therefore, we can eliminate options C, F, G, H, I, K, O. + +Next, we need to determine where Logan thinks Emma thinks the peas is. We know that Emma moved the peas to the red_pantry, but we don't know if Logan witnessed this. However, we do know that Isabella moved the peas to the blue_treasure_chest, and Logan moved the peas to the blue_bathtub. Therefore, Logan knows that the peas is not in the blue_treasure_chest or the blue_pantry. We can eliminate options E and L. + +Now, we need to determine where Logan thinks Hannah thinks the peas is. We know that Hannah moved the peas to the blue_treasure_chest, but we don't know if Logan witnessed this. However, we do know that Isabella dislikes the tangerine, which means she did not move the peas to the green_bottle (since the question states that the peas is in the red_bottle). Therefore, Logan knows that the peas is not in the green_bottle. We can eliminate option C. + +Finally, we need to determine where Logan thinks Chloe thinks Hannah thinks Emma thinks the peas is. We know that Chloe lost his phone and did not witness any of the movements of the peas. Therefore, Logan cannot infer what Chloe thinks about the location of the peas. + +Based on the above analysis, the answer to the question is A. red_bottle. + +a: 5 6 7 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..18698a1d59ab659d96058c69ce742523810d6ab0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of the cherry and the agents. According to the story, the cherry was initially in the blue_suitcase (statement 2). Isla moved the cherry to the red_bottle (statement 7), Ava moved it to the green_basket (statement 9), and finally, Nathan moved it back to the blue_suitcase (statement 11). Therefore, the cherry is in the blue_suitcase (option G). + +Note that we cannot trust any statements made by the agents, as they tend to lie (assumption 3). Also, the movements of Emma and William are not relevant to the location of the cherry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbe0613ea878f886c2d3b42448b9aafbc60e659e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. 
+15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Nathan really think the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to trace Nathan's movements and any interactions he had with other agents. According to the story, Nathan moved the cherry to the blue_suitcase (step 11) and then exited the sunroom (step 13). There is no mention of Nathan having any private or public interactions with any other agents regarding the cherry's location. Therefore, we can assume that Nathan's actual thought is that the cherry is in the blue_suitcase. 
The answer is G. blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..aed2387cfeeb69bb70ae46d25c82ba990c0bbf0d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does William think Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. 
green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of Nathan and the cherry. We know that the cherry was initially in the blue_suitcase, then Isla moved it to the red_bottle, Ava moved it to the green_basket, and finally Nathan moved it to the blue_suitcase again. + +We also know that William saw a cat before Nathan exited the sunroom, so he did not witness Nathan moving the cherry back to the blue_suitcase. + +Therefore, William would not know that the cherry is back in the blue_suitcase and would likely think that it is still in the last place he saw it, which was the red_bottle. + +So, the answer is I. red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cd2919fe39c1b1930d069da16729c5c76cc760d8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. 
+2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Ava think William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This question requires a lot of attention to detail and inference based on the assumptions given. We need to track where the cherry and the agents are at each step and who knows what information. + +First, we know that Nathan moved the cherry to the blue_suitcase and William saw a cat after that. So, William cannot know where the cherry is. + +Next, we know that Isla moved the cherry to the red_bottle and Ava moved it to the green_basket before Nathan exited the sunroom. So, Nathan cannot know where the cherry is either. + +Therefore, Ava cannot think that William thinks Nathan knows where the cherry is. + +We can eliminate options A, B, C, and G. + +Now, we need to focus on where Ava thinks William thinks the cherry is. We know that Isla privately told William that the sweet_potato is in the green_bathtub. However, we cannot assume that William trusts Isla's information. + +We need to look at where the cherry was last seen before William exited the sunroom. The cherry was in the blue_suitcase, which is the same place where Nathan moved it. Therefore, Ava may think that William thinks the cherry is still in the blue_suitcase. + +The answer is option G, blue_suitcase. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e03892e6e436eb5d0196554f12431b6e0655065 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. 
+2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Emma think Ava thinks William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: This question requires a lot of deduction based on the given assumptions and the story. We need to trace the path of the cherry and the agents' movements to determine where Emma thinks Ava thinks William thinks Nathan thinks the cherry is. + +According to the story, the cherry starts in the blue_suitcase (step 2), then Isla moves it to the red_bottle (step 7), Ava moves it to the green_basket (step 9), and finally, Nathan moves it back to the blue_suitcase (step 11). + +William sees a cat after Nathan moves the cherry, so he doesn't know where the cherry is at the end. Isla privately tells William that the sweet_potato is in the green_bathtub (step 25), but we don't know if William believes her or not. + +Ava exits the laundry after moving the sweet_potato to the blue_cupboard (step 20), and Nathan exits the sunroom after moving the cherry to the blue_suitcase (step 11). Since William sees a cat after Nathan moves the cherry, he exits the sunroom after Nathan. + +Emma, Ava, and Isla enter the waiting_room together (step 23), and then Isla privately tells William that the sweet_potato is in the green_bathtub (step 25). Therefore, Emma knows that Isla told William about the sweet_potato, but she doesn't know where the cherry is. + +Based on the assumptions, Emma can infer where Ava thinks William thinks Nathan thinks the cherry is because she knows that Ava exited the laundry after moving the sweet_potato to the blue_cupboard (step 20), and Nathan exited the sunroom after moving the cherry to the blue_suitcase (step 11). Therefore, Emma thinks that Ava thinks William thinks Nathan thinks the cherry is in the blue_cupboard (option C). + +The answer is C. blue_cupboard. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aa9462422befa927c016b83e4c2f42bd006818c6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where is the watermelon really? 
+Answer: blue_container +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the agents and the watermelon. According to the story, Benjamin moved the watermelon to the green_drawer, and then Isabella moved it to the blue_bucket. Therefore, the watermelon is in the blue_bucket. The answer is I. blue_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a86b89fa87cf6a657e0adc4f62cfec2f808ec67 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. 
+6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Benjamin really think the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track Benjamin's movements and statements regarding the watermelon. According to the story, Benjamin moved the watermelon from the blue_bottle to the green_drawer. He also made a statement that he dislikes lime. However, there is no mention of Benjamin making any statement or movement regarding the watermelon after he exited the workshop. Therefore, we can assume that Benjamin still thinks the watermelon is in the green_drawer. The answer is D. red_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c3eb6c8f0126721d4b46ad90e7872e1ff89a5afc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. 
+17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Emma think Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track the movements of the watermelon and Benjamin's preferences. According to the story, Benjamin moved the watermelon from the blue_bottle to the green_drawer and likes the blue_bottle. Emma made no movements with the watermelon and exited the workshop after Benjamin. 
Therefore, Emma would know that Benjamin moved the watermelon to the green_drawer and likes the blue_bottle. So, Emma would think that Benjamin thinks the watermelon is in the G. blue_bottle. + +The answer is G. blue_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbb8db185cf53c8033c4effbc443a542d676c91a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. 
+28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Isabella think Emma thinks Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To answer this question, we need to track the movements of the agents and their thoughts about the location of the watermelon. From the story, we know that Benjamin moved the watermelon from the blue_bottle to the green_drawer, and Isabella later moved it to the blue_bucket. We also know that Benjamin likes the blue_bottle and dislikes the lime. Emma made no movements and stayed in the workshop for 1 minute before exiting, so we don't have any information about her thoughts on the watermelon's location. + +Therefore, Isabella has no reason to think that Emma has any particular thoughts about the watermelon's location. The answer is none of the above. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..321cbf9db873477d6e6d4e1c6276e8acaad09e19 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. 
+Question: Where does Liam think Isabella thinks Emma thinks Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: To solve this question, we need to trace the movements and thoughts of Liam, Isabella, Emma, and Benjamin regarding the watermelon. + +According to the story, Liam lost his phone when he entered the workshop with Benjamin, Isabella, Emma, and Charlotte. Benjamin moved the watermelon from the blue_bottle to the green_drawer and then exited the workshop. Isabella then moved the watermelon to the blue_bucket before exiting the workshop. Emma made no movements and stayed in the workshop for 1 minute before exiting. Charlotte then moved the watermelon to the blue_container before exiting. Liam made no movements and stayed in the workshop for 1 minute before exiting. + +Later, Liam, Isabella, Emma, Charlotte, and Benjamin entered the waiting_room. Charlotte, Liam, and Isabella then entered the lounge. The green_pepper is in the red_bottle, and Charlotte moved it to the green_envelope before exiting the lounge. 
Liam then moved the green_pepper to the red_drawer before exiting the lounge. Isabella then moved the green_pepper to the red_box before exiting the lounge. Liam likes the blue_bucket, and he privately told Isabella that the green_pepper is in the red_bottle. Isabella then privately told Benjamin that the green_pepper is in the red_box. + +Based on these movements and interactions, we can determine that Liam thinks Isabella thinks Emma thinks Benjamin thinks the watermelon is in the blue_bucket. + +Therefore, the answer is I. blue_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c44ce72aa7f3f35120d2586674cc75adbf9f68a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. 
+19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where is the peach really? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their interactions. According to the story, the peach was initially in the red_basket (step 2). Then, William moved the peach to the green_bathtub (step 7), and Elizabeth moved it back to the red_basket (step 11). Therefore, the peach is in the red_basket, which is option L. The answer is L. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..438d3889fcdf6ea5ac68b847547de092e74f3765 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1,39 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Chloe really think the peach is? +Answer: green_bathtub +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. 
red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To answer this question, we need to look at the movements of each agent and their interactions. Nathan and Isabella entered the basement first, but made no movements and exited after a minute each. William then moved the peach from the red_basket to the green_bathtub, and Chloe made no movements before exiting the basement. Finally, Elizabeth moved the peach back to the red_basket before all agents entered the waiting_room. + +Based on these movements, Chloe did not witness the peach being moved by William or Elizabeth. She also did not have any private or public interactions with Isabella or William regarding the peach's location. Therefore, the only information Chloe has is that the peach was initially in the red_basket before she entered the basement and that it was back in the red_basket when she exited. + +Therefore, Chloe really thinks the peach is in the red_basket. The answer is L. red_basket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a696cc59422efa5c6b73a8fef0309627f43156ee --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1,41 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Isabella think Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. 
red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: To answer this question, we need to track the movements of Isabella and Chloe and the location of the peach. Isabella and Chloe both entered the basement and waited for a minute before leaving. William moved the peach from the red basket to the green bathtub before leaving. Elizabeth then moved the peach back to the red basket before leaving the basement. + +Based on the given assumptions, we know that Isabella and Chloe were in the same place and witnessed the movements of William and Elizabeth. Isabella privately told William that the beans are in the red box, but we don't know if she shared any information about the location of the peach with anyone. + +Therefore, we need to look at the movements of Chloe and the final location of the peach. Chloe made no movements in the basement and waited for a minute before leaving. We don't know if she saw William move the peach to the green bathtub or Elizabeth move it back to the red basket. However, we do know that the peach ended up in the red basket, which is the same location it was in when Nathan, Isabella, William, Chloe, and Elizabeth first entered the basement. 
+ +Based on this information, we can conclude that Isabella thinks Chloe thinks the peach is in the red basket. Therefore, the answer is L. red_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c3c886e66a7aa633fd18c41c51bbd2e6dae15d8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1,75 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. 
+Question: Where does Nathan think Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Nathan and Isabella both entered the basement, but Nathan made no movements and stayed for only 1 minute before leaving. Isabella also made no movements and stayed for 1 minute before leaving. We don't know if they interacted or not. + +2. The peach is in the red_basket. This information is given to us directly. + +3. William entered the basement after Nathan and Isabella left, and he moved the peach to the green_bathtub before leaving. + +4. Chloe entered the basement after William left, but she made no movements and stayed for only 1 minute before leaving. + +5. Elizabeth entered the basement after Chloe left, and she moved the peach back to the red_basket before leaving. + +6. All five agents then entered the waiting_room together. + +7. Isabella, Elizabeth, and William then entered the workshop together. + +8. The beans is in the green_drawer. + +9. 
Isabella moved the beans to the red_box before leaving the workshop. + +10. Elizabeth then moved the beans to the blue_bucket before leaving the workshop. + +11. William then moved the beans to the red_bucket before leaving the workshop. + +12. Elizabeth dislikes the plum. This information is given to us directly. + +13. Isabella lost his phone. This information is given to us directly. + +14. William publicly claimed that the beans is in the green_drawer. + +15. Isabella privately told William that the beans is in the red_box. + +Based on these steps, we can start to piece together where Nathan thinks Isabella thinks Chloe thinks the peach is. We know that Nathan and Isabella were both in the basement at the same time, but we don't know if they interacted or not. We also know that Chloe entered the basement after Nathan and Isabella left, so Nathan wouldn't have any direct knowledge of Chloe's movements or thoughts. + +However, we do know that the peach was moved from the red_basket to the green_bathtub by William, and then back to the red_basket by Elizabeth. Isabella was present in the workshop when the beans were moved from the green_drawer to the red_box, and then privately told William about it. We don't know if Nathan was present for any of these events. + +So, where does Nathan think Isabella thinks Chloe thinks the peach is? We can eliminate any answer choices that don't involve the red_basket, since we know that the peach ended up there. We can also eliminate any answer choices that involve the workshop or waiting_room, since Chloe was only present in the basement. + +That leaves us with three possible answer choices: red_bucket, green_bathtub, and green_drawer. Of these, the most likely answer is green_drawer, since that's where the beans were originally located and Isabella was present when they were moved to the red_box. 
Nathan may assume that Isabella thinks Chloe also knows the location of the beans and therefore the peach, since they were both in the workshop together. + +Therefore, the answer is F. green_drawer. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..69bb2ea5d68118aaa6a6dc7e6be1e6950a5ef86b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. 
+Question: Where does William think Nathan thinks Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: This is a complex question that requires careful analysis. We need to trace the path of the peach and the movements of the agents to determine where William thinks Nathan thinks Isabella thinks Chloe thinks the peach is. + +First, we know that the peach starts in the red_basket (step 2). Then, William moves the peach to the green_bathtub (step 7), and Elizabeth moves it back to the red_basket (step 11). + +Next, we need to consider the movements of the agents. Nathan and Isabella both enter and exit the basement without moving anything (steps 1, 3, 4, 5). Chloe also enters and exits the basement without moving anything (steps 1, 9, 10). + +In the workshop, Isabella moves the beans from the green_drawer to the red_box (steps 15, 16), and Elizabeth moves them from the red_box to the blue_bucket (steps 18, 19). William then moves the beans to the red_bucket (step 20) and publicly claims that they are in the green_drawer (step 25). 
Isabella privately tells William that the beans are actually in the red_box (step 26). + +Based on these movements and interactions, we can determine that William thinks Nathan thinks Isabella thinks Chloe thinks the peach is in the green_drawer (option F). Here's why: + +- Nathan and Isabella both enter and exit the basement without moving anything, so they have no information about the peach's location. +- Chloe also enters and exits the basement without moving anything, so she also has no information about the peach's location. +- In the workshop, Isabella moves the beans from the green_drawer to the red_box, so she knows that the peach is not in the green_drawer. +- Elizabeth moves the beans from the red_box to the blue_bucket, so she also knows that the peach is not in the green_drawer. +- William moves the beans to the red_bucket and publicly claims that they are in the green_drawer, but Isabella privately tells him that they are actually in the red_box. Therefore, William knows that the peach is not in the green_drawer. +- Since Nathan, Isabella, and Chloe have no information about the peach's location, William must rely on Elizabeth's movements to determine where the peach is. Elizabeth moved the peach from the green_bathtub to the red_basket, so William knows that Elizabeth thinks the peach is in the red_basket. +- William trusts Elizabeth's judgment because she exited the workshop after him (step 22), so he assumes that she has more information than he does. +- Therefore, William thinks that Nathan thinks Isabella thinks Chloe thinks the peach is in the green_drawer (option F). + +The answer is F. green_drawer. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7b7594f799fac4bdea088723dde02d73a643593 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where is the asparagus really? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. 
green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: To answer this question, we need to trace the movements of each agent and their interactions. According to the story, Hannah initially put the asparagus in the green cupboard, but later moved it to the green treasure chest. None of the other agents interacted with the asparagus or mentioned its location, so we can assume that it is still in the green treasure chest. Therefore, the correct answer is B. green_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..893e37abb98f9c03de02137d67ab56f528655c4f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. 
+6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Aiden really think the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_treasure_chest +GPT-4 Explain: To answer this question, we need to look at the movements of Hannah, Owen, Emily, Aiden, and Avery and their interactions. We know that Hannah moved the asparagus to the green_treasure_chest and the carrot to the green_drawer. Owen likes the green_basket and moved the carrot to the green_basket after Hannah. Aiden made no movements in the bathroom but privately told Emily that the carrot is in the green_basket. We don't have any information about Aiden's thoughts on the asparagus, but we know that Hannah moved it to the green_treasure_chest. Therefore, the answer is B. green_treasure_chest. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..be388b21897c91b4b484b85e6e1d1bbceb3be18f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1,42 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. 
+19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Emily think Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: To answer this question, we need to track the movements of Aiden and Emily and their interactions with each other. Aiden made no movements in the hall and stayed in the bathroom for 1 minute before exiting. Emily made no movements in the hall and stayed in the hall for 1 minute before exiting. Aiden privately told Emily that the carrot is in the green_basket. + +We know that Emily likes the red_crate and that the carrot is not in the blue_crate. 
We also know that Hannah moved the carrot to the green_drawer and then Owen moved it to the green_basket. However, we are looking for where Emily thinks Aiden thinks the asparagus is, not the carrot. + +Unfortunately, there is no information in the story about where the asparagus is currently located. We only know that it was initially in the green_cupboard and then Hannah moved it to the green_treasure_chest. + +Therefore, we cannot answer this question with the given information. The correct answer is: Insufficient information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3deb6a9044397445c2edc314fe8b3c02a22bc2a7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. 
+21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Avery think Emily thinks Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Avery think Emily thinks Aiden thinks the asparagus is? + +We need to determine the location of the asparagus according to the story. From step 2, we know that the asparagus is in the green_cupboard. However, we also know from step 4 that Hannah moved the asparagus to the green_treasure_chest. It's unclear whether Avery is aware of this movement, so we can't assume that she knows the asparagus is in the green_treasure_chest. + +2. 
What does Emily think about the location of the asparagus? + +We don't have any direct information about Emily's thoughts on the location of the asparagus. However, we do know that Aiden privately told Emily that the carrot is in the green_basket (step 27). This doesn't give us any information about the asparagus, but it does suggest that Emily trusts Aiden's information. + +3. What does Aiden think about the location of the asparagus? + +We don't have any direct information about Aiden's thoughts on the location of the asparagus. However, we do know that Aiden privately told Emily that the carrot is in the green_basket (step 27). This doesn't give us any information about the asparagus, but it does suggest that Aiden knows the location of the carrot. + +4. What does Avery think about Aiden's thoughts on the location of the asparagus? + +We don't have any direct information about Avery's thoughts on the location of the asparagus. However, we do know that Avery and Aiden were both in the hall together (step 10), so they could have had a private conversation about the location of the asparagus. We also know that Avery exited the hall after Aiden (step 11), so she may trust his information more than someone who exited earlier. + +Based on this analysis, we can't determine where Avery thinks Emily thinks Aiden thinks the asparagus is. The information we have is too limited and doesn't provide a clear answer to the question. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..90483992fc93755dbacb4d09d5ce692280af8e2e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1,65 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where is the asparagus? +- According to the story, the asparagus was initially in the green_cupboard (line 2), but Hannah moved it to the green_treasure_chest (line 4). + +2. Who likes the green_basket? +- Owen likes the green_basket (line 12). + +3. Where is the carrot? +- The carrot was initially in the blue_crate (line 17), but Hannah moved it to the green_drawer (line 19), and then Owen moved it to the green_basket (line 21). + +4. What did Hannah publicly claim about the carrot? +- Hannah publicly claimed that the carrot is in the blue_crate (line 26). + +5. What did Aiden privately tell Emily about the carrot? +- Aiden privately told Emily that the carrot is in the green_basket (line 27). + +Now, let's try to answer the main question: + +Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? + +- We know that Hannah moved the asparagus to the green_treasure_chest (line 4), but we don't have any information about what Avery, Emily, or Aiden think about the asparagus. +- However, we do know that Avery was in the same room as Hannah, Owen, Emily, and Aiden before they entered the waiting_room (line 15). Therefore, Avery could have overheard their conversations or observed their movements. +- Since we don't have any direct information about what Avery thinks, we need to make some assumptions based on the given rules: + - Avery may have heard Hannah claim that the carrot is in the blue_crate (line 26), but since we know that Hannah tends to lie, Avery may not trust this claim. 
+ - Aiden privately told Emily that the carrot is in the green_basket (line 27), but we don't know if Avery overheard this conversation or if Emily shared this information with Avery. + - Since Owen likes the green_basket (line 12) and moved the carrot there (line 21), Avery may assume that the asparagus is also in the green_basket. + - Emily likes the red_crate (line 18), but we don't know if she has any thoughts about the asparagus. + - Aiden made no movements in the bathroom (line 23), but we don't know if he has any thoughts about the asparagus. +- Based on these assumptions, we can conclude that Hannah may think that Avery thinks Emily thinks Aiden thinks the asparagus is in the green_basket (option H). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..60e84276cf86d0780a93cdaeabbcd649b2af85ea --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. 
+16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where is the lettuce really? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the lettuce and the statements made by the agents. According to the story, the lettuce was initially in the green_pantry (step 2), then William moved it to the blue_cupboard (step 3), Charlotte moved it to the blue_bathtub (step 7), Aiden moved it to the red_box (step 9), and finally, Isla moved it back to the green_pantry (step 11). 
Therefore, the lettuce is really in the green_pantry. + +We can eliminate options B, E, F, G, H, K, L, M, N, and O as they are not mentioned in the story. Option I is mentioned in the story, but it is where Amelia tells William the location of the apple, not the lettuce. Option J is where Charlotte moved the apple to, but it is not the location of the lettuce. Therefore, the correct answer is A. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..507886d3cc79b49250df01dfa0e23c8b0290faf8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. 
+22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Isla really think the lettuce is? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to trace Isla's movements with the lettuce. According to the story, Isla moved the lettuce to the green_pantry before exiting the living_room. Therefore, Isla really thinks the lettuce is in the green_pantry. The answer is A. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f8a6c7105b38aae36991cf4129f42aa66e6899c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Charlotte think Isla thinks the lettuce is? +Answer: blue_bathtub +Choices: A. green_pantry, B. red_basket, C. 
blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: To answer this question, we need to track the movements of the lettuce and the agents' interactions. + +1. William, Amelia, Charlotte, Aiden, and Isla entered the living_room. +2. The lettuce is in the green_pantry. +3. William moved the lettuce to the blue_cupboard. +4. William exited the living_room. +5. Amelia made no movements and stayed in the living_room for 1 minute. +6. Amelia exited the living_room. +7. Charlotte moved the lettuce to the blue_bathtub. +8. Charlotte exited the living_room. +9. Aiden moved the lettuce to the red_box. +10. Aiden exited the living_room. +11. Isla moved the lettuce to the green_pantry. +12. Isla exited the living_room. + +From the above movements, we can see that Isla moved the lettuce to the green_pantry before leaving the living_room. Therefore, Charlotte thinks that Isla thinks the lettuce is in the green_pantry. + +The answer is A. green_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fba80667ad9c1300d24d6bb6c18f85fe5eee383 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Amelia think Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. 
blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to trace the movements of the lettuce and the agents' interactions. Here are the steps to follow: + +1. Amelia and Charlotte were both in the living room when the lettuce was moved by William from the green pantry to the blue cupboard. +2. Charlotte then moved the lettuce from the blue cupboard to the blue bathtub before leaving the living room. +3. Aiden then moved the lettuce from the blue bathtub to the red box before leaving the living room. +4. Isla finally moved the lettuce from the red box back to the green pantry before leaving the living room. +5. Amelia and Charlotte both entered the sunroom where Charlotte moved the apple from the red bucket to the blue container before leaving the room. +6. William then entered the sunroom and stayed there for a minute before leaving. +7. Amelia also stayed in the sunroom for a minute before leaving. +8. Charlotte, William, and Amelia then entered the waiting room where William publicly claimed that the apple was in the blue container. +9. Amelia privately told William that the apple was actually in the blue suitcase. 
+ +Based on these movements and interactions, we can conclude that Amelia and Charlotte were both in the living room when the lettuce was moved from the green pantry to the blue cupboard by William. However, we don't have any information about what Isla or Aiden think about the lettuce's location. + +Therefore, the answer to the question is C. blue cupboard, which is where William moved the lettuce to before leaving the living room. We don't have any information about what Charlotte thinks about the lettuce's location, so we can't infer what Isla thinks about it either. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d42459ebf348ea5b4c396c5ff511666c8452247d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1,46 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. 
+19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Aiden think Amelia thinks Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: Step 1: Identify the agents involved in the question. The question asks about Aiden's thoughts regarding Amelia's thoughts about Charlotte's thoughts about Isla's thoughts about the lettuce. Therefore, we need to focus on Aiden, Amelia, Charlotte, Isla, and the lettuce. + +Step 2: Trace the movements of the lettuce. 
The lettuce starts in the green_pantry, is moved to the blue_cupboard by William, then to the blue_bathtub by Charlotte, then to the red_box by Aiden, and finally back to the green_pantry by Isla. + +Step 3: Determine the interactions between the agents. There are no private or public interactions between Aiden and Amelia, so Aiden cannot directly know what Amelia thinks. However, Aiden can infer Amelia's thoughts if he knows what Charlotte thinks, since Amelia and Charlotte were in the sunroom together. William publicly claimed that the apple is in the blue_container, but we do not know if Aiden trusts William's claim. + +Step 4: Determine the exit order of the agents. Isla exited the living_room last, followed by William, Amelia, Charlotte, and Aiden. Therefore, Aiden trusts Isla the most and Charlotte the least. + +Step 5: Trace the movements of the apple. The apple starts in the red_bucket, is moved to the blue_container by Charlotte, and William publicly claims that it is in the blue_container. However, Amelia privately tells William that the apple is actually in the blue_suitcase. + +Step 6: Determine the answer. Since Aiden cannot directly know what Amelia thinks, he needs to infer her thoughts based on Charlotte's thoughts. Charlotte moved the lettuce to the blue_bathtub, so Aiden knows that Charlotte does not think the lettuce is in the green_pantry. Since Aiden trusts Isla the most, he assumes that Isla thinks the lettuce is in the green_pantry. Therefore, Aiden thinks that Amelia thinks that Charlotte thinks that Isla thinks the lettuce is in the green_pantry. The answer is A. green_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b681982e11df0c92925ae411305ebcd8d951d597 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where is the apple really? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. 
green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To solve this question, we need to track the movements of each agent and their interactions. According to the story, Jack moved the apple to the green_bottle, but we don't know if he told anyone about it. However, we do know that no one else made any movements in the den or waiting room, so they couldn't have moved the apple. Therefore, the apple must still be in the green_bottle. The answer is D. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c0d90bd6b6037a7e14f874461a334f54fde3d485 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. 
+8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Jack really think the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to look at the movements of each agent and their interactions. 
Jack moved the apple to the green_bottle and then exited the den. We don't have any information about Jack's interactions with other agents or his movements after he left the den. Therefore, based on the given information, we can assume that Jack really thinks the apple is in the green_bottle. The answer is D. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..565bf86b88f0f59042a3df860008b07d7ba0a6c0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. 
+25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Evelyn think Jack thinks the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to determine where Jack moved the apple and who knows about it. According to the story, Jack moved the apple to the green_bottle and then exited the den. After that, no one else entered the den before the agents entered the waiting_room. Therefore, only Jack knows that the apple is in the green_bottle. However, Evelyn did not have any interactions with Jack, so she cannot know where Jack thinks the apple is. Therefore, the answer is not given in the story and cannot be determined. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f45d7d505fa50f90cd8bc481ddf16b2cd076c3ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1,44 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Ella think Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. 
green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: This question requires a bit of deduction and inference. We need to figure out where each agent thinks the apple is and who they trust. From the story, we know that Jack moved the apple to the green_bottle and then left the den. Therefore, Jack thinks the apple is in the green_bottle. + +Next, we need to figure out who knows where the apple is. We know that Evelyn stayed in the den and then the sunroom without making any movements, so she doesn't know where the apple is. Amelia stayed in the den and then the sunroom without making any movements, so she also doesn't know where the apple is. Ella stayed in the den for a minute without making any movements, so she doesn't know where the apple is either. + +Now, we need to figure out who trusts whom. According to the assumptions, agents tend to trust agents who exited the room later than themselves. We know that Jack exited the den before everyone else, so no one trusts him. We also know that Hannah exited the den last, so everyone trusts her. + +Finally, we need to figure out where each agent thinks the other agents think the apple is. Since no one knows where the apple is except for Jack, everyone else will have to make a guess. 
We don't have any information about where Hannah thinks the apple is, so we can't use her to help us. + +Evelyn doesn't know where the apple is, so she can't have an opinion on where Jack thinks it is. Amelia and Ella also don't know where the apple is, so they can't have an opinion on where Jack thinks it is either. However, we do know that Ella moved the onion to the red_pantry and publicly claimed that it was in the green_treasure_chest. We also know that Evelyn privately told Ella that the onion is in the red_pantry. Therefore, we can infer that Ella trusts Evelyn more than she trusts herself or Amelia. + +Since Jack moved the apple to the green_bottle, and we know that Ella trusts Evelyn more than herself or Amelia, we can assume that Ella thinks that Evelyn thinks that Jack thinks the apple is in the green_bottle. Therefore, the answer is D. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5bca6f6cec8fc8475918d6360d7601107c055d8f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. 
+13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? + +2. We know that Jack moved the apple to the green_bottle, but we need to determine where each agent thinks the apple is. + +3. 
We don't have any information about what Amelia thinks about the apple's location, so we need to work backwards from what she knows about Ella and Evelyn. + +4. We know that Ella publicly claimed that the onion is in the green_treasure_chest, but we need to determine if she made any public claims about the apple's location. + +5. We also know that Evelyn privately told Ella that the onion is in the red_pantry, but we don't have any information about what she told Ella about the apple's location. + +6. We know that Ella likes the green_bucket, but we don't have any information about how this relates to the apple's location. + +7. Based on the assumption that agents tend to trust those who exit a room later than themselves, we can assume that each agent trusts the information provided by the agents who exited the den and sunroom after them. + +8. Therefore, we can assume that Amelia trusts Jack's claim that the apple is in the green_bottle. + +9. We also know that each agent tends to lie, so we can't assume that any public or private claims about the apple's location are true. + +10. Based on this analysis, we can conclude that Amelia thinks that Ella thinks that Evelyn thinks that Jack thinks the apple is in the green_bottle. + +11. Therefore, the answer is D. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..203714c3f5cbc607b6feb5a9baa72c03544f4497 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. 
+3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where is the peas really? +Answer: green_bottle +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. 
red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to follow the movements of the agents and their private and public interactions. According to the story, Emily publicly claimed that the peas is in the blue_suitcase, but Isabella privately told Logan that the peas is in the green_bottle. We also know that Logan tends to trust an agent that exited the room later than himself. Therefore, we can infer that the peas is actually in the green_bottle, which is where Isabella told Logan it was. + +The correct answer is M. green_bottle. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fdf727716e6323ec467f4459604a3954b40e5a52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. 
+3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jack really think the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. 
green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track Jack's movements and any interactions he had with other agents regarding the location of the peas. According to the story, Jack likes the blue_crate and he moved the peas from the blue_suitcase to the red_crate. However, there is no information about Jack's thoughts or any private or public interactions he had regarding the location of the peas after he moved them to the red_crate. Therefore, we cannot determine where Jack really thinks the peas is. The answer is not provided in the options given. + +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce959b16560ab6a2ea0b17a33d7f708a7e525fb2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. 
+3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jackson think Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. 
green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to track the movements of Jackson and Jack and their interactions with the peas. According to the story, Jackson made no movements in the hallway, but he dislikes turnips. Jack likes the blue crate and moved the peas from the blue suitcase to the red crate before exiting the hallway. Therefore, Jackson knows that Jack was in the hallway and had access to the peas. + +Later, Emily publicly claimed that the peas is in the blue suitcase, but Isabella privately told Logan that the peas is in the green bottle. Since Jackson did not hear Isabella's private conversation with Logan, he still believes that the peas is in the blue suitcase. + +After that, Isabella, Emily, Jack, and Logan entered the patio, and Isabella moved the cherry to the green envelope before exiting. Jack made no movements in the patio, so he did not have any interaction with the peas. Therefore, Jackson's belief about where Jack thinks the peas is should not change based on the events in the patio. + +Finally, Isabella privately told Emily that the cherry is in the blue cupboard, and Logan privately told Jackson the same thing. 
Since Jackson trusts Logan more than Isabella (since Logan exited the waiting room after Jackson), he should believe that the cherry is in the blue cupboard. However, this information does not affect his belief about where Jack thinks the peas is. + +Therefore, the answer to the question is A. blue_crate, since that is where Jack moved the peas to before exiting the hallway, and Jackson has no reason to believe that Jack's belief about the location of the peas has changed. + +a: 1 6 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff6eda86064d7b7ddda3098f4fc2ee54211a26e4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1,74 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. 
+21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Logan think Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions. To break it down: + +- We are looking for Logan's belief about Jackson's belief about Jack's belief about the location of the peas. +- Logan's belief about Jackson's belief is based on what Jackson publicly claims or privately tells Logan. +- Jackson's belief about Jack's belief is not directly stated in the story, so we need to infer it based on the available information. + +To solve the question, we need to trace the information about the peas and the movements of the agents: + +- The peas is initially in the blue_suitcase (step 2). +- Jack likes the blue_crate (step 6). +- Jack moves the peas to the red_crate (step 8). +- Emily moves the peas to the green_bottle (step 10). +- Emily publicly claims that peas is in the blue_suitcase (step 16). +- Isabella privately tells Logan that the peas is in the green_bottle (step 17). + +Based on this information, we can infer that: + +- Jack initially thinks the peas is in the blue_suitcase (since it's the starting location and he hasn't moved it yet). +- Emily thinks the peas is in the green_bottle (since she moved it there and publicly claimed it). +- Isabella knows that the peas is in the green_bottle (since she privately told Logan). +- Jackson's belief about Jack's belief is not directly stated, but we can make some assumptions based on the available information. Since Jack likes the blue_crate and initially thinks the peas is in the blue_suitcase, it's possible that Jackson thinks Jack still believes the peas is in the blue_suitcase or has moved it to the blue_crate (since he likes it). However, we cannot be certain about this. + +Now we need to find where Logan thinks Jackson thinks Jack thinks the peas is. We know that Logan privately told Jackson that the cherry is in the blue_cupboard (step 41), but this doesn't give us any information about the peas. 
We also know that Logan exited the attic after Isabella moved the potato to the red_basket (step 21), so he trusts Isabella more than Emily or Jack. Therefore, he might believe that Jackson trusts Isabella more as well. Since Isabella privately told Logan that the peas is in the green_bottle, Logan might think that Jackson believes Jack thinks the peas is in the green_bottle (since Isabella's information is more reliable). Therefore, the answer is M. green_bottle. + +a: 6 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad951c937ba0015a5bb9177d1073a5df163d39e5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1,84 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. 
+21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Isabella think Logan thinks Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions. We need to track the movements and thoughts of each character and their interactions with each other. + +First, we need to identify the chain of thoughts that Isabella is thinking about. According to the question, Isabella is thinking about what Logan thinks Jackson thinks Jack thinks about the peas. + +We know that Emily publicly claimed that the peas is in the blue_suitcase, but we also know that the characters tend to lie. Isabella privately told Logan that the peas is in the green_bottle, so we can assume that she knows the true location of the peas. + +Logan privately told Jackson that the cherry is in the blue_cupboard, but we don't know if Jackson trusts Logan's information. We also don't know if Jack or Emily have any information about the location of the peas. + +Based on the story, we know that Jack likes the blue_crate and moved the peas to the red_crate. However, we also know that Jack tends to lie, so we can't be sure if the peas is actually in the red_crate. + +Isabella moved the potato to the red_basket, but we don't have any information about her thoughts on the location of the peas. + +Therefore, we need to look for clues about what Logan, Jackson, and Jack might think about the location of the peas. Logan made no movements in the hallway and exited before Jackson, so Jackson might trust Logan's information more than Jack's or Emily's. + +Logan moved the potato to the blue_crate in the attic, but we don't know if he has any information about the location of the peas. + +Based on these clues, we can eliminate some of the answer choices. The peas is not in the green_drawer, green_bathtub, green_pantry, red_envelope, red_bucket, or red_pantry, because there is no evidence to suggest that any character has any information about these locations. 
+ +The peas is also not in the blue_suitcase, because we know that Isabella privately told Logan that the peas is in the green_bottle. + +The peas is not in the red_crate, because we don't know if Jack was telling the truth when he moved the peas to the red_crate. + +The peas is not in the blue_drawer, because there is no evidence to suggest that any character has any information about this location. + +This leaves us with three possible answer choices: green_bottle, blue_cupboard, and green_envelope. + +Isabella privately told Logan that the peas is in the green_bottle, but we don't know if Logan trusts Isabella's information. + +Logan privately told Jackson that the cherry is in the blue_cupboard, but we don't know if Jackson trusts Logan's information. + +Isabella moved the cherry to the green_envelope, but we don't know if she has any information about the location of the peas. + +Therefore, we cannot determine where Isabella thinks Logan thinks Jackson thinks Jack thinks the peas is. The answer is unknown. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbe3c40a70f0a9528edba648b2419d121188a2d4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. 
+11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where is the persimmon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. 
red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: To determine the location of the persimmon, we need to track its movements based on the story and assumptions given. + +1. The persimmon is initially in the green_bathtub (statement 3). +2. Emily moves the persimmon to the red_envelope (statement 5). +3. Mila moves the persimmon to the green_box (statement 7). +4. Benjamin moves the persimmon to the red_pantry (statement 10). +5. Therefore, the persimmon is really in the red_pantry (option D). + +The answer is D. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c294d3985dcb09109e9e0f360464d8a37662946 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. 
+8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Mila really think the persimmon is? +Answer: green_bucket +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. 
green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To determine where Mila really thinks the persimmon is, we need to follow Mila's movements and any private or public interactions she had with other agents. Mila initially liked the red_envelope, but Emily moved the persimmon to the red_envelope. Mila then moved the persimmon to the green_box before exiting the back_yard. In the waiting_room, Emma publicly claimed that the persimmon is in the green_bucket, but Charlotte privately told Emily that the persimmon is in the green_bathtub. Mila then entered the garden with Charlotte and Emma, but made no movements and exited after a minute. Mila then moved the eggplant to the blue_cupboard before entering the waiting_room with Charlotte and Emma. + +Based on Mila's movements and interactions, we can infer that Mila thinks the persimmon is in the green_box, as that was the last place she moved it to before exiting the back-yard. Therefore, the answer is C. green_box. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d98bf827b6bccbb7bd6480833171f673b9d6a2c3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Emily think Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to track the movements of Emily and Mila regarding the persimmon. According to the story, Emily moved the persimmon to the red_envelope, and Mila later moved it to the green_box. However, we don't know what Mila thinks about the location of the persimmon. 
+ +We can infer that Emily trusts Benjamin more than Mila because Benjamin exited the back_yard after Emily. Therefore, Emily might believe Benjamin's claim about the location of the persimmon more than Mila's claim. + +However, we also know that agents tend to lie, so we cannot be sure about anyone's claim. Therefore, we cannot determine where Emily thinks Mila thinks the persimmon is. + +The answer is: Cannot be determined. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5a973a7b7ca5aef53e3da1e4ad21a4a93cd7fac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. 
+23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. +33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Charlotte think Emily thinks Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to trace the movements of the persimmon and the interactions between the characters. + +According to the story, the persimmon was initially in the green_bathtub (step 3), then Emily moved it to the red_envelope (step 5), Mila moved it to the green_box (step 7), Benjamin moved it to the red_pantry (step 10), and finally Charlotte moved it back to the green_bathtub (step 15). + +There is no direct interaction between Emily and Mila regarding the persimmon, so we need to look for any indirect interactions. The only interaction that involves both Emily and Mila is step 4, where Mila likes the red_envelope. However, this does not give us any information about the persimmon's location. + +Next, we need to consider Charlotte's interactions. In step 19, Charlotte privately told Emily that the persimmon is in the green_bathtub. This means that Charlotte knows the persimmon's location, and she also knows that Emily knows it. However, we don't know if Charlotte has any information about Mila's thoughts on the persimmon's location. + +To find out where Charlotte thinks Emily thinks Mila thinks the persimmon is, we need to look for any interactions between Charlotte and Mila that might give us a clue. The only interaction between them is step 20, where they both enter the garden with Emma. However, there is no mention of any communication or interaction between Charlotte and Mila in this step. + +Therefore, we cannot determine where Charlotte thinks Emily thinks Mila thinks the persimmon is based on the given information. The answer is unknown. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fbd472d391a4eeed595f31a8d80f85cdc56650cc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1,94 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Benjamin think Charlotte thinks Emily thinks Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Benjamin moved the persimmon to the red_pantry (step 10). +2. Emily privately told Benjamin that the apple is in the green_bottle (step 45). +3. 
We need to find out where Benjamin thinks Charlotte thinks Emily thinks Mila thinks the persimmon is. + +To answer this question, we need to trace the movements of each character and their interactions with each other. Here's what we know: + +- Emily moved the persimmon to the red_envelope (step 5). +- Mila moved the persimmon to the green_box (step 7). +- Charlotte moved the persimmon to the green_bathtub (step 15). +- Emma publicly claimed that persimmon is in the green_bucket (step 18). + +Based on these movements, we can infer that: + +- Emily knows the persimmon was originally in the green_bathtub (step 3) and moved it to the red_envelope (step 5). +- Mila moved the persimmon from the red_envelope to the green_box (step 7). +- Charlotte moved the persimmon from the green_box to the green_bathtub (step 15). +- Emma falsely claimed that the persimmon was in the green_bucket (step 18). + +Now, let's apply the assumptions given in the question: + +- Benjamin knows that Charlotte exited the back_yard after Mila (step 9) and saw her in the waiting_room (step 17). +- Benjamin knows that Emily privately told him where the apple is (step 45). +- Benjamin knows that Charlotte publicly claimed that the apple is in the blue_cupboard (step 43). + +Based on these assumptions, we can infer that: + +- Benjamin trusts Charlotte more than Emma, since Charlotte exited the back_yard after Emma (step 8) and Benjamin exited after Charlotte (step 12). +- Benjamin knows that Emily moved the persimmon to the red_envelope (step 5) and that Mila moved it to the green_box (step 7). +- Benjamin knows that Charlotte moved the persimmon to the green_bathtub (step 15). +- Benjamin knows that Mila exited the back_yard before Charlotte (step 9) and that Charlotte saw Emily privately (step 19). + +Putting all of this together, we can conclude that: + +- Benjamin thinks that Mila thinks the persimmon is in the green_box (where she left it). 
+- Emily knows that the persimmon is actually in the green_bathtub (where Charlotte moved it). +- Charlotte publicly claimed that the apple is in the blue_cupboard (which Benjamin knows). +- Therefore, Benjamin thinks that Charlotte thinks Emily thinks the persimmon is in the green_box (where Mila left it), but he knows that it's actually in the green_bathtub (where Charlotte moved it). + +So the answer is C. green_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..deb118820101d4beb8c4af25e8cd1e37da2e9f58 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. 
+21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where is the spinach really? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_pantry +GPT-4 Explain: Based on the story and assumptions, we know that Isla moved the spinach to the green_pantry and Abigail dislikes the spinach. Therefore, the correct answer is F. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5fe969bd61ab18c5371692dc0c0ff284b43de95 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. 
+26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Abigail really think the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track Abigail's movements and interactions with other agents. According to the story, Abigail entered the sunroom with four other agents, made no movements, and stayed there for one minute before exiting. 
She then entered the waiting room with the same four agents, before moving to the patio with Isla and Jack. Abigail made no movements in the patio and stayed there for one minute before exiting. + +There is no mention of Abigail interacting with the spinach or expressing any thoughts about it while in the sunroom or the waiting room. However, we do know that Abigail dislikes spinach, and Isla moved the spinach to the green_pantry. + +Therefore, based on the given assumptions, we can infer that Abigail thinks the spinach is in the green_pantry, despite not publicly claiming it. The correct answer is F. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b58523ecda658072d1d2074bdeb7cbbe74f69516 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. 
+17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Benjamin think Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Benjamin and Abigail. According to the story, Abigail made no movements in the sunroom and then exited, while Benjamin made no movements in the sunroom and then exited. Therefore, they were both in the sunroom at the same time, but did not interact with each other. Later, Abigail, Isla, and Jack entered the patio, but Benjamin was not mentioned to be there. Therefore, Benjamin did not witness Abigail's interaction with Isla and Jack in the patio. + +The only information we have about Abigail's thoughts on the spinach is that she dislikes it. We also know that Isla moved the spinach to the green_pantry after Abigail exited the sunroom. However, Benjamin was not present for either of these events. Therefore, we cannot determine where Benjamin thinks Abigail thinks the spinach is. + +The answer is not provided in the multiple-choice options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..39d699f094729110d6b6c796d451a0d6e9634f58 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. 
+7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Jack think Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. 
green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to trace Jack's thoughts and assumptions. According to the story, Jack publicly claimed that the spinach is in the green_pantry (step 15). However, Isla privately told Jack that the spinach is in the blue_suitcase (step 16). Therefore, Jack knows that the spinach is not in the green_pantry, but he may or may not know where it actually is. + +We also know that Benjamin, Isla, Amelia, and Jack entered the front_yard (step 26), and Benjamin made no movements and stayed in the front_yard for 1 minute (step 28). Therefore, Jack exited the front_yard later than Benjamin, and he may trust Benjamin's judgment more than his own. + +However, we don't have any information about where Abigail thinks the spinach is. Therefore, we cannot determine where Jack thinks Benjamin thinks Abigail thinks the spinach is. + +The answer is: Cannot be determined. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8db3bf594ddb0294ca15d18050f08f7b796e1467 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1,71 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. 
+30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? + +We need to determine the location of the spinach based on the story. According to step 2, the spinach is in the green_pantry. However, we also know from step 11 that Abigail dislikes spinach. 
This information is important because it tells us that Abigail is unlikely to have moved the spinach to the green_pantry herself. + +2. Who knows where the spinach is located? + +We know that Isla moved the spinach to the green_pantry (step 12), but only Jack knows this information because Isla privately told him (step 16). Therefore, Amelia does not know where the spinach is located. + +3. What does Jack think about the location of the spinach? + +Jack publicly claimed that the spinach is in the green_pantry (step 15), but we know that he actually knows it is in the blue_suitcase (step 16). Therefore, Jack thinks the spinach is in the blue_suitcase. + +4. What does Benjamin think about the location of the spinach? + +There is no information in the story to suggest what Benjamin thinks about the location of the spinach. + +5. What does Abigail think about the location of the spinach? + +There is no information in the story to suggest what Abigail thinks about the location of the spinach. + +6. Putting it all together + +Amelia thinks that Jack thinks Benjamin thinks Abigail thinks the spinach is in the green_pantry (option F). However, we know that Jack actually thinks the spinach is in the blue_suitcase (option J). Therefore, the correct answer is J. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8aa936a8968cce473949a7f79942ef1b8ab44117 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. 
+3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where is the spinach really? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. 
green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the agents and their private and public interactions related to the spinach. According to the story, Isabella, Avery, Hannah, Noah, and Nathan entered the dining room. Isabella made no movements and stayed in the dining room for 1 minute before exiting. Avery moved the spinach to the red crate and then exited the dining room. Hannah moved the spinach to the green cupboard and then exited the dining room. Finally, Nathan moved the spinach to the green pantry and then exited the dining room. + +Later, Hannah privately told Isabella that the spinach is in the green cupboard, and Avery privately told Noah that the spinach is in the green pantry. Isabella publicly claimed that the cherry is in the green pantry, but we cannot trust her claim as the agents tend to lie. + +Therefore, based on the movements and interactions of the agents, we can conclude that the spinach is actually in the green pantry (option L). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fdee5eeaa3f4a29fe9bf82520d49a02df671ab36 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. 
+30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Avery really think the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to look for any private interactions that Avery had with other agents regarding the location of the spinach. According to the story, Avery privately told Noah that the spinach is in the green_pantry. Therefore, the correct answer is L. green_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..14bd86e7d28bba90e9c1d71be95d2b86cef0449a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1,68 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. 
+30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Hannah think Avery thinks the spinach is? +Answer: red_crate +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: To answer this question, we need to track the movements of Hannah and Avery and their private communication. + +1. Isabella, Avery, Hannah, Noah, and Nathan entered the dining room. +2. The spinach is in the green pantry. +3. Isabella made no movements and stayed in the dining room for 1 minute. +4. Isabella exited the dining room. +5. Avery moved the spinach to the red crate. +6. Avery exited the dining room. +7. 
Hannah moved the spinach to the green cupboard. +8. Hannah exited the dining room. +13. Isabella, Avery, Hannah, Noah, and Nathan entered the waiting room. +15. Hannah privately told Isabella that the spinach is in the green cupboard. +16. Avery privately told Noah that the spinach is in the green pantry. +26. Avery, Noah, and Hannah entered the waiting room. +39. Isabella publicly claimed that the cherry is in the green pantry. +40. Avery privately told Hannah that the cherry is in the green box. + +From the story, we know that Hannah moved the spinach to the green cupboard and privately told Isabella about it. Avery moved the spinach to the red crate and privately told Noah that the spinach is in the green pantry. Hannah did not witness Avery's movement, but she knows that Avery exited the dining room after her. Therefore, she would trust Avery more than Noah. + +So, Hannah would think that Avery thinks the spinach is in the green pantry, which is the answer choice (E). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e1a975db280e471a2d3c08802401518031b0adb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. 
+10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Isabella think Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to trace the movements and interactions of Isabella, Hannah, and Avery regarding the spinach. Isabella did not move the spinach, but she knows that Avery moved it to the red crate and Hannah moved it to the green cupboard. Hannah privately told Isabella that the spinach is in the green cupboard, and Avery privately told Noah that the spinach is in the green pantry. Isabella publicly claimed that the cherry is in the green pantry. + +Based on these movements and interactions, we can infer that Isabella thinks Hannah thinks Avery thinks the spinach is in the green pantry. Therefore, the answer is D. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..05833416adc5eb188bb099a27b8e78fb0617394f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. 
+4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Nathan think Isabella thinks Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. 
red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Nathan moved the spinach to the green_pantry (step 11). +2. Isabella privately told Hannah that the spinach is in the green_cupboard (step 15). +3. Avery privately told Noah that the spinach is in the green_pantry (step 16). +4. Hannah moved the spinach to the green_cupboard (step 7). + +Based on these steps, we can infer that Nathan thinks Isabella thinks Hannah thinks Avery thinks the spinach is in the green_cupboard. Therefore, the answer is O. green_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..950680dc9db5966d9b14dcdc3329fe635636b74d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. 
+2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where is the onion really? +Answer: green_crate +Choices: A. blue_bottle, B. 
green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to follow the movements of the onion and the agents. According to the story, the onion was initially in the green_crate (statement 4). Then, Lily moved the onion to the blue_bucket (statement 11), but later Abigail moved it to the red_bucket (statement 29). Finally, Emily moved the onion back to the green_crate (statement 35). + +Mila privately told Jack that the onion is in the green_crate (statement 39), which means that the onion is really in the green_crate. Therefore, the answer is B. green_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..640af8cc7ad44382912d2765fa380432a47eb763 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. 
+2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Mila really think the onion is? +Answer: red_bucket +Choices: A. 
blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track Mila's movements and interactions with other agents. Mila saw a cat and then entered the master_bedroom with Jack, Abigail, Emily, and Lily. She made no movements and stayed in the master_bedroom for 1 minute before exiting. She then entered the waiting_room with the others. Later, Mila moved the pear to the green_pantry and exited the porch. + +In the master_bedroom, Lily publicly claimed that the onion is in the blue_bucket, but Mila privately told Jack that the onion is in the blue_bucket. However, when Abigail, Lily, Mila, and Emily re-entered the master_bedroom, Abigail moved the onion to the red_bucket. + +Finally, Emily privately told Jack that the onion is in the green_crate. + +Based on this information, Mila's private communication with Jack suggests that she thinks the onion is in the blue_bucket. However, since Abigail moved the onion to the red_bucket and Emily told Jack that the onion is in the green_crate, it's unclear where the onion actually is. + +Therefore, the answer is not listed among the options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..320d51c642d5993d99ab45c42e3a7c892bfd0585 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1,96 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. 
+31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Abigail think Mila thinks the onion is? +Answer: red_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track the movements of Abigail and Mila and their interactions with each other. + +1. Mila saw a cat. (Irrelevant to the question) +2. Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3. Emily lost his watch. (Irrelevant to the question) +4. The onion is in the green_crate. +5. Jack made no movements and stayed in the master_bedroom for 1 minute. +6. Jack exited the master_bedroom. +7. Abigail made no movements and stayed in the master_bedroom for 1 minute. +8. 
Abigail exited the master_bedroom. +9. Emily made no movements and stayed in the master_bedroom for 1 minute. +10. Emily exited the master_bedroom. +11. Lily moved the onion to the blue_bucket. +12. Lily exited the master_bedroom. +13. Mila made no movements and stayed in the master_bedroom for 1 minute. +14. Mila exited the master_bedroom. +15. Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16. Lily publicly claimed that onion is in the blue_bucket. +17. Mila privately told Jack that the onion is in the blue_bucket. +18. Mila, Abigail and Emily entered the porch. +19. The pear is in the red_bottle. +20. Mila moved the pear to the green_pantry. +21. Mila exited the porch. +22. Abigail moved the pear to the green_basket. +23. Abigail exited the porch. +24. Emily made no movements and stayed in the porch for 1 minute. +25. Emily exited the porch. +26. Mila, Abigail and Emily entered the waiting_room. +27. Abigail, Lily, Mila and Emily entered the master_bedroom. +28. The onion is in the blue_bucket. +29. Abigail moved the onion to the red_bucket. +30. Abigail exited the master_bedroom. +31. Lily made no movements and stayed in the master_bedroom for 1 minute. +32. Lily exited the master_bedroom. +33. Mila made no movements and stayed in the master_bedroom for 1 minute. +34. Mila exited the master_bedroom. +35. Emily moved the onion to the green_crate. +36. Emily exited the master_bedroom. +37. Abigail, Lily, Mila and Emily entered the waiting_room. +38. Lily privately told Mila that the onion is in the green_crate. +39. Emily privately told Jack that the onion is in the green_crate. + +Based on the assumption that Abigail tends to lie, we cannot trust her public claim that the onion is in the red_bucket. We need to look for any private interactions she had with Mila. + +From step 18, we know that Abigail and Mila were together in the porch. However, there is no mention of them discussing the location of the onion. 
+ +From step 26, we know that Abigail, Lily, Mila, and Emily were together in the waiting_room. Again, there is no mention of Abigail and Mila discussing the onion. + +Therefore, we cannot determine where Abigail thinks Mila thinks the onion is. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6ab3181b6f47a0413476367a76e95775fc0d64b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1,80 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. 
+25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Jack think Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions given. To break it down: + +- We are looking for Jack's belief about Abigail's belief about Mila's belief about the location of the onion. 
+- We need to consider the movements and interactions of each character to determine their possible beliefs about the onion's location. +- We also need to keep in mind that characters may lie and that trust is based on exit order. + +Step-by-step analysis: + +- Mila saw the cat, which is not relevant to the question. +- Jack, Abigail, Emily, Lily, and Mila entered the master bedroom. Emily lost his watch, which is not relevant to the question. +- The onion is in the green crate, but no one knows this yet. +- Jack stayed in the master bedroom for one minute and then exited. Abigail did the same. Emily and Mila also stayed in the master bedroom for one minute each before exiting. +- Lily moved the onion to the blue bucket after everyone else had left the master bedroom. +- Mila privately told Jack that the onion is in the blue bucket, but this is a lie. +- Abigail publicly claimed that the onion is in the blue bucket, which is also a lie. +- Mila, Abigail, and Emily entered the porch. The pear is in the red bottle, but this is not relevant to the question. +- Mila moved the pear to the green pantry and then exited. Abigail moved the pear to the green basket and then exited. Emily stayed in the porch for one minute before exiting. +- Abigail, Lily, Mila, and Emily entered the master bedroom. The onion is in the blue bucket, but this is a lie. +- Abigail moved the onion to the red bucket and then exited. Lily stayed in the master bedroom for one minute before exiting. Mila also stayed in the master bedroom for one minute before exiting. +- Emily moved the onion to the green crate and then exited. +- Lily privately told Mila that the onion is in the green crate, which is the truth. +- Emily privately told Jack that the onion is in the green crate, which is also the truth. + +Based on this analysis, we can determine the following beliefs: + +- Jack knows that the onion is in the green crate because Emily told him. 
+- Abigail knows that the onion is not in the blue bucket because she moved it to the red bucket. +- Mila knows that the onion is not in the blue bucket because she moved the pear to the green pantry and saw that the onion was not there. +- Abigail, Lily, and Mila all know that the onion is not in the red bucket because Abigail moved it there and they were all present. +- Abigail, Lily, and Mila all know that the onion is not in the blue bucket because they were all present when Lily moved it to the blue bucket. +- Jack does not know where Abigail thinks Mila thinks the onion is because there is no information about their beliefs or interactions regarding the onion. + +Therefore, the answer is none of the above. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..468902772953bc2bd4215391c2183cb6130e0760 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. 
+15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Emily think Jack thinks Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. We need to find out where Emily thinks Jack thinks Abigail thinks Mila thinks the onion is. +2. According to the story, Mila privately told Jack that the onion is in the blue_bucket, but Lily publicly claimed that the onion is in the blue_bucket. +3. Abigail later moved the onion to the red_bucket, but Emily moved it to the green_crate. +4. We know that agents tend to lie, so we cannot trust what they say. +5. We also know that agents tend to trust those who exited the room later than themselves. + +Based on these assumptions, we can make the following deductions: + +1. Emily knows that Jack was in the master_bedroom when Lily claimed that the onion is in the blue_bucket. +2. Emily also knows that Abigail moved the onion to the red_bucket, but she cannot be sure if Jack knows this. +3. Mila privately told Jack that the onion is in the blue_bucket, but Emily cannot be sure if Jack believes her. +4. Emily moved the onion to the green_crate, so she knows where it actually is. +5. Emily cannot be sure what Abigail, Lily, or Mila actually think about the onion's location. + +Therefore, the answer to the question is B. green_crate, because that is where Emily knows the onion actually is, and she cannot be sure what Jack, Abigail, or Mila actually think about its location. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..42bcea3521fa550c480af5eb91766e003e2c3a47 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. 
+32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where is the carrot really? +Answer: green_crate +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To solve this question, we need to track the movements of the carrot and the statements made by the characters. According to the story, the carrot was initially in the red envelope (statement 3). Isabella moved it to the red container (statement 11) and then Abigail moved it back to the red envelope (statement 13). Later, Emma moved the carrot to the red drawer (statement 30). Isabella privately told Nathan that the carrot is in the green crate (statement 40). 
However, we know that the characters tend to lie, so we cannot trust this statement completely. + +Therefore, the correct answer is L. red_envelope, as that is the last known location of the carrot according to the story. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e17eee33bf79ed1586ff54fd7b24d4025aa32a29 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. 
+27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Abigail really think the carrot is? +Answer: red_drawer +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: To answer this question, we need to look for any private interactions Abigail had with other agents regarding the location of the carrot. According to the story, Abigail privately told Nathan that the carrot is in the red_envelope (step 17). Therefore, the correct answer is L. 
red_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a5efc756849504a6773b32338182a2b221ac241 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. 
+31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Nathan think Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Nathan and Abigail regarding the carrot. According to the story, Abigail moved the carrot to the red_envelope and privately told Nathan about it. Later, Isabella moved the carrot to the green_crate and privately told Nathan about it. However, we are only concerned with Abigail's movements and Nathan's thoughts about her belief. 
+ +Based on the assumption that an agent tends to trust another agent who exited the room later than himself, we know that Nathan exited the front_yard before Abigail. Therefore, he may not fully trust her belief about the carrot's location. However, we also know that Abigail privately told Nathan that the carrot is in the red_envelope, so he may still consider that as a possibility. + +Therefore, the answer to the question is L. red_envelope, as that is where Abigail believes the carrot is, and Nathan may also consider that as a possibility based on their private interaction. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7801608a203d3a4aa25253709f824a56b0c22ef8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1,67 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. 
+18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Avery think Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. We need to find out where Avery thinks Nathan thinks Abigail thinks the carrot is. This means we need to trace the path of the carrot and who knows where it is. + +2. According to step 3, we know that the carrot is in the red_envelope. This is public knowledge because Isabella publicly claimed it in step 16. + +3. In step 17, Abigail privately told Nathan that the carrot is in the red_envelope. This means that Nathan knows where the carrot is. + +4. We need to figure out where Abigail thinks the carrot is. According to step 13, Abigail moved the carrot to the red_envelope. This means that Abigail knows where the carrot is. + +5. Now we need to figure out where Avery thinks Abigail thinks the carrot is. We know that Avery saw a dog in step 6 and made no movements in the front_yard in steps 9 and 10. This means that Avery did not witness the movement of the carrot in steps 11, 13, 29, or 36. + +6. However, Avery did witness the movement of the eggplant in steps 23 and 25. This means that Avery knows where the eggplant is, but not necessarily where the carrot is. + +7. We need to look for any interactions between Avery and Abigail that might give us a clue. According to step 18, Emma, Avery, and Abigail entered the lounge together. However, there is no mention of any private or public interactions between Avery and Abigail. + +8. We also need to consider the exit order. According to assumption 4, agents tend to trust agents that exited the room later than themselves. In step 10, Avery exited the front_yard after Nathan. This means that Avery might trust Nathan's knowledge of the carrot's location more than Abigail's. + +9. 
Putting all of this together, we can conclude that Avery might think that Abigail thinks the carrot is in the red_envelope, based on the fact that Isabella publicly claimed it in step 16 and Abigail privately told Nathan in step 17. However, there is no definitive answer to this question based on the information given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..409f8223c7b5d18a972084b2ebcfd8bc8ad9c3dd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1,61 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. 
+25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Isabella think Avery thinks Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. 
To break it down, we need to identify the chain of thoughts that Isabella is supposed to be thinking about. According to the question, Isabella is thinking about what Avery thinks Nathan thinks Abigail thinks about the location of the carrot. + +To solve this question, we need to work backwards from Isabella's thoughts to determine where the carrot is located. We know from step 40 that Isabella privately told Nathan that the carrot is in the green_crate. Therefore, we can assume that Isabella thinks the carrot is in the green_crate. + +Next, we need to determine what Avery thinks about the location of the carrot. We know from step 25 that Abigail moved the eggplant to the green_basket, and from step 26 that Abigail exited the lounge. Therefore, Avery would have seen the eggplant in the green_basket before exiting the lounge. However, we don't have any information about what Avery thinks about the location of the carrot. + +Moving on to Nathan, we know from step 19 that he saw a cat, but we don't have any information about what he thinks about the location of the carrot. + +Finally, we come to Abigail. We know from step 17 that Abigail privately told Nathan that the carrot is in the red_envelope. However, we also know from step 13 that Abigail moved the carrot to the red_envelope before exiting the front_yard. Therefore, we can assume that Abigail thinks the carrot is in the red_envelope. + +Putting it all together, Isabella thinks that Abigail thinks the carrot is in the red_envelope. We don't have any information about what Isabella thinks Avery thinks Nathan thinks about the location of the carrot, so we can't answer the question as it is currently phrased. + +Therefore, the answer is not provided in the options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f6d343a620ed1db6090a02a8fb8bd9a17a605da1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. 
+32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where is the peach really? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the peach and the statements made by the agents. According to the story, the peach was initially in the red_bucket (line 2). Aiden moved the peach to the red_pantry (line 6) and later privately told Sophia that the peach is in the red_envelope (line 16). However, we know that agents tend to lie, so we cannot trust this statement. Benjamin privately told Abigail that the peach is in the red_pantry (line 15) and later moved the peach to the red_crate (line 19). 
Abigail moved the peach to the red_pantry again (line 24) and later moved the plum to the green_cupboard (line 35). Therefore, the peach is in the red_pantry (option N). + +The answer is N. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c89d0e75c9c360d0d96fe65ae626fe423d8add16 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. 
+27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Abigail really think the peach is? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track Abigail's movements and any private or public interactions she had regarding the peach. According to the story, Abigail made no movements when the peach was initially in the red_bucket, and she exited the hallway before Aiden moved the peach to the red_pantry. 
Later, when Benjamin privately told her that the peach is in the red_pantry, she made no movements and exited the hallway. Therefore, based on the given assumptions, we can infer that Abigail did not have any private or public interactions regarding the peach after Benjamin told her its location. So, Abigail really thinks that the peach is in the red_pantry. The answer is N. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5f957388fc5d59ec8cf38fa6ffbff6f9ff57f5b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. 
+23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Sophia think Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to trace the movements of Abigail and Aiden with respect to the peach. 
Abigail made no movements when the peach was in the red_bucket, but Aiden moved it to the red_pantry and privately told Sophia that the peach is in the red_envelope. Later, Abigail moved the peach to the red_pantry again. Therefore, Sophia would think that Abigail thinks the peach is in the red_pantry (option N). + +The answer is N. red_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b57a86c5230735b583fc3f1c8464258dc2451006 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. 
+24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Aiden think Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To solve this question, we need to trace Aiden's thoughts and actions. 
Aiden moved the peach to the red_pantry and privately told Sophia that the peach is in the red_envelope. We also know that Abigail moved the peach to the red_pantry later on. However, we don't have any information about Sophia's thoughts or actions regarding the peach. + +Therefore, we cannot determine where Aiden thinks Sophia thinks Abigail thinks the peach is. The answer is not provided in the given story and assumptions. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ab792a0387a47617aef258ed429ce13820b9d553 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. 
+21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Isla think Aiden thinks Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_bucket +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions. To break it down, we need to identify the agents involved and their interactions: + +- Isla: moved the peach to the red_bucket, then moved the plum to the red_pantry, and publicly claimed that the plum is in the red_bucket. +- Aiden: likes the red_crate, privately told Sophia that the peach is in the red_envelope, and made no movements in the hallway. +- Sophia: received information from Aiden, but we don't know what she thinks about the peach. +- Abigail: made no movements in the hallway, saw a monkey, moved the plum to the green_cupboard, and moved the peach to the red_pantry. +- Benjamin: made no movements in the hallway, privately told Abigail that the peach is in the red_pantry, moved the peach to the red_crate, privately told Sophia that the plum is in the green_cupboard, and dislikes the watermelon. + +Based on these interactions, we can eliminate some options that are not relevant to the question, such as blue and green containers, and focus on the red ones. We also need to consider the trust relationships between the agents, which are based on the exit order. Isla exited the hallway before Aiden, so she trusts him more than Benjamin or Abigail. However, she has no direct interaction with Sophia, so she cannot infer her thoughts unless Aiden tells her. + +To answer the question, we need to follow the chain of thoughts from Isla to Aiden to Sophia to Abigail to the peach location. Isla thinks that the plum is in the red_bucket, but that's not relevant to the peach. Aiden privately told Sophia that the peach is in the red_envelope, but we don't know what Sophia thinks about it. Abigail moved the peach to the red_pantry, but that's not where Isla thinks Aiden thinks Sophia thinks Abigail thinks the peach is. Benjamin privately told Abigail that the peach is in the red_pantry, but Isla doesn't trust him as much as Aiden. 
Therefore, the only option left is the one that Aiden likes: the red_crate. Isla thinks that Aiden thinks Sophia thinks Abigail thinks the peach is in the red_crate. + +The answer is B. blue_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c95ec13b2c5ee5a2fa90a1d5e7aeb1b229a7d490 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. 
+28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where is the cherry really? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track the movements of the cherry and the statements made by the agents. According to the story, the cherry was initially in the green_envelope, which Noah liked. However, Owen moved the cherry to the blue_bucket before exiting the front_yard. 
Aiden then moved the cherry to the blue_cupboard before exiting the front_yard as well. Later, Noah publicly claimed that the cherry is in the green_envelope, but Ella privately told Noah that the cherry is in the blue_bottle. However, we don't know if Ella's statement is true or false. Therefore, we need to look at the movements of the cherry after this point. The cherry is not mentioned again in the story, so we don't know if it was moved again or not. Therefore, the answer to the question is either F. green_envelope or G. blue_bottle, depending on whether Ella's statement is true or false. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..514929f91af49dad920971b65bce58778dec9e39 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. 
+19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Aiden really think the cherry is? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to trace Aiden's movements and interactions with other agents. Aiden moved the cherry to the blue_cupboard and then exited the front_yard. There is no information about any private or public interactions where Aiden revealed his actual thought about the cherry's location. Therefore, we can only rely on Aiden's last known location of the cherry, which is the blue_cupboard. So, the answer is J. blue_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7f419a02e2e2edad7532f4653902e8b553bcdf3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. 
+18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Noah think Aiden thinks the cherry is? +Answer: green_envelope +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track the movements of Aiden, Owen, Avery, Noah, and Ella regarding the cherry. From the story, we know that Aiden saw the cat and then entered the front yard with Owen, Avery, Noah, and Ella. The cherry was initially in the green envelope, and Noah liked the green envelope. However, Owen moved the cherry to the blue bucket before exiting the front yard. Avery lost his phone and stayed in the front yard for a minute before exiting. Noah also stayed in the front yard for a minute before exiting. Aiden moved the cherry to the blue cupboard before exiting the front yard. Ella stayed in the front yard for a minute before exiting. Later, in the waiting room, Noah publicly claimed that the cherry is in the green envelope, but Ella privately told Noah that the cherry is in the blue bottle. + +Now, we need to determine where Noah thinks Aiden thinks the cherry is. Since Aiden moved the cherry to the blue cupboard before exiting the front yard, he likely thinks the cherry is in the blue cupboard. However, we need to consider if any other agents' actions or claims could have influenced Noah's thoughts about Aiden's beliefs. From the story, we know that Avery privately told Noah that the lettuce is in the blue treasure chest, but there is no mention of Avery telling Noah anything about the cherry. Therefore, we can assume that Avery's claim did not affect Noah's thoughts about Aiden's beliefs regarding the cherry. + +Based on the information provided, the answer is J. blue cupboard. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..69cc97875c31e64ca09087ed7a269b3241f38c97 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1,65 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. 
+32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Owen think Noah thinks Aiden thinks the cherry is? +Answer: blue_bucket +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. We need to find out where Owen thinks Noah thinks Aiden thinks the cherry is. This means we need to trace the chain of thoughts from Owen to Noah to Aiden to the cherry's location. + +2. According to the story, Noah publicly claimed that the cherry is in the green_envelope. This means that Owen knows that Noah thinks the cherry is in the green_envelope. + +3. 
However, we also know that every agent tends to lie, so we can't trust Noah's claim completely. + +4. We need to find out where Aiden thinks the cherry is. There are two possible locations: the green_envelope (where Noah claimed it is) and the blue_cupboard (where Aiden moved it to). + +5. We don't know for sure which location Aiden thinks the cherry is in, but we can make an educated guess based on the exit order. Aiden exited the front_yard before Noah, which means Noah might trust Aiden's judgment more than his own. Therefore, it's possible that Noah thinks Aiden thinks the cherry is in the blue_cupboard. + +6. Finally, we need to find out where Owen thinks Noah thinks Aiden thinks the cherry is. Based on the assumptions, Owen tends to trust agents who exited the room later than himself. Since Owen exited the front_yard before Noah and Aiden, he might not trust their judgment as much. Therefore, it's possible that Owen thinks Noah thinks Aiden thinks the cherry is in the green_envelope (where Noah claimed it is). + +7. Therefore, the answer is F. green_envelope. + +Note: This is just one possible interpretation of the story and assumptions. There may be other valid answers depending on how you interpret the characters' actions and thoughts. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a11e4d6846b119d4513112a7daa9c4c7d64f0e93 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. 
+5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? +Answer: blue_bucket +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. 
blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Ella privately told Noah that the cherry is in the blue_bottle. +2. Noah publicly claimed that cherry is in the green_envelope. +3. Owen moved the cherry to the blue_bucket. +4. Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? + +Based on the assumptions given, we know that Ella can only infer Noah's thoughts if she had a private interaction with him. We also know that agents tend to lie, so Noah's public claim may not reflect his actual thoughts. + +From step 1, we know that Ella thinks the cherry is in the blue_bottle. From step 2, we know that Noah claimed the cherry is in the green_envelope, but we don't know if that's his actual thought. From step 3, we know that Owen moved the cherry to the blue_bucket, but we don't know if he did it based on his own thoughts or if he was following someone else's instructions. + +So, we can't determine where Ella thinks Owen thinks Noah thinks Aiden thinks the cherry is with certainty. However, based on the given information, the most likely answer is J. 
blue_cupboard, since that's where Aiden moved the cherry to before exiting the front yard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3862917928f7ffd30e6d9c216e76d6adf7d9d687 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. 
+30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where is the turnip really? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To determine where the turnip really is, we need to track its movements throughout the story. According to the story, the turnip starts in the green_crate (2), is moved to the blue_pantry by Liam (5), then to the red_bottle by William (7), and finally ends up in the green_basket after Sophia and Benjamin move it there (20-23). Therefore, the correct answer is A. green_basket. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..96394c12d1267235f60b62ab7a05a6127bf83ff6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. 
+32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does William really think the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: To answer this question, we need to track William's movements and interactions with other agents. According to the story, William moved the turnip to the red_bottle and privately told Sophia that the turnip is in the red_bottle. Later, William privately told Hannah that the tomato is in the red_basket. We also know that agents tend to lie, so we cannot trust what William told Sophia or Hannah. However, we can infer that William thinks the turnip is not in the green_crate (moved by Liam) or the green_basket (moved by Sophia). 
We also know that the turnip is in the red_bottle according to statement 19. Therefore, the answer is D. red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7833191cdac8fb16354156fa5ad981a81afa1026 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. 
+29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Benjamin think William thinks the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: To answer this question, we need to track the movements and private interactions of Benjamin and William regarding the turnip. According to the story, Benjamin and William both entered the porch and the waiting room together. William privately told Sophia that the turnip is in the red_bottle, but there is no mention of William telling Benjamin anything about the turnip. 
However, we know that Benjamin moved the turnip to the green_crate after Sophia moved it to the green_basket. This means that Benjamin knows the turnip was not in the green_basket when he moved it to the green_crate. + +Based on this information, we can eliminate options A, J, and K since Benjamin knows the turnip was not in those locations when he moved it to the green_crate. We can also eliminate options C, E, F, G, H, I, and L since there is no mention of the turnip being in those locations. + +This leaves us with options B and N. Liam privately told Hannah that the turnip is in the green_crate, but we don't know if Benjamin overheard this conversation or not. However, we do know that William saw a monkey after Benjamin exited the porch, which means that Benjamin exited the porch before William. Since Benjamin tends to trust agents who exit a room later than himself, he may assume that William did not see where he moved the turnip to. Therefore, Benjamin may think that William still believes the turnip is in the red_bottle, which is option D. + +So the answer is D. red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f368863347f6ff80f116c43ae27d1100c17742cd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1,85 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. 
+9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Sophia think Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to trace the movements and interactions of Sophia, Benjamin, and William regarding the turnip. + +1. Sophia, Liam, William, Hannah, and Benjamin entered the porch. +2. The turnip is in the green_crate. +3. Sophia made no movements and stayed in the porch for 1 minute. +4. Sophia exited the porch. +5. Liam moved the turnip to the blue_pantry. +6. Liam exited the porch. +7. William moved the turnip to the red_bottle. +8. William exited the porch. +9. Hannah made no movements and stayed in the porch for 1 minute. +10. Hannah exited the porch. +11. William saw a monkey. +12. Benjamin made no movements and stayed in the porch for 1 minute. +13. Benjamin exited the porch. +14. Sophia, Liam, William, Hannah, and Benjamin entered the waiting_room. +15. Sophia saw a mouse. +16. William privately told Sophia that the turnip is in the red_bottle. +17. Liam privately told Hannah that the turnip is in the green_crate. +18. Sophia, Benjamin, and Hannah entered the porch. +19. The turnip is in the red_bottle. +20. Sophia moved the turnip to the green_basket. +21. Sophia exited the porch. +22. Benjamin moved the turnip to the green_crate. +23. Benjamin exited the porch. +24. Hannah made no movements and stayed in the porch for 1 minute. +25. Hannah exited the porch. +26. Sophia, Benjamin, and Hannah entered the waiting_room. 
+ +Based on the above movements and interactions, we can infer that Sophia knows the turnip was initially in the green_crate, then moved to the blue_pantry by Liam, and then to the red_bottle by William. However, William privately told Sophia that the turnip is in the red_bottle, which is where it actually is. + +Benjamin was in the porch when William moved the turnip to the red_bottle, but he made no movements and stayed there for a minute before exiting. Therefore, Benjamin does not know where the turnip actually is. + +William did not have any private or public interactions with Benjamin regarding the turnip, so Benjamin cannot infer William's thought about the turnip. + +Therefore, Sophia cannot know where Benjamin thinks William thinks the turnip is. The answer is none of the given options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b124e2f63b8bfbab50945c03cf59abbb7c38b2ff --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. 
+15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Liam think Sophia thinks Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: First, we need to determine where Liam thinks the turnip is. According to step 6, Liam moved the turnip to the blue_pantry. However, we also know that William privately told Sophia that the turnip is in the red_bottle (step 16) and that the turnip is actually in the red_bottle (step 19). Therefore, Liam's belief about the turnip's location is not accurate. + +Next, we need to determine where Sophia thinks Benjamin thinks William thinks the turnip is. According to step 17, Liam privately told Hannah that the turnip is in the green_crate. However, we know that the turnip is actually in the red_bottle (step 19). Therefore, Sophia would not believe that William thinks the turnip is in the green_crate. + +We also know that Sophia moved the turnip to the green_basket (step 20) and Benjamin moved it to the green_crate (step 22). Therefore, it is possible that Sophia thinks Benjamin thinks the turnip is in the green_basket or the green_crate. + +However, we need to consider Liam's exit order. Liam exited the porch before William (step 6 and 7). According to assumption 4, agents tend to trust an agent that exited the room later than themselves. Therefore, Sophia may be more likely to believe William's claim about the turnip's location (step 16) than Liam's private claim to Hannah (step 17). + +Based on this reasoning, Sophia may think that Benjamin thinks William thinks the turnip is in the red_bottle (the actual location) or the green_basket (where Sophia moved it). Therefore, the answer is either D. red_bottle or J. green_pantry. 
However, since the question asks where Liam thinks Sophia thinks Benjamin thinks William thinks the turnip is, we cannot definitively choose between these two options. The answer is either D. red_bottle or J. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..32bab3c1d4b9394f833aecfa68716561fc427658 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. 
+24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where is the cabbage really? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: Step 1: Look for all the statements related to the cabbage. +- Statement 2: The cabbage is in the green_bucket. +- Statement 14: William publicly claimed that cabbage is in the green_envelope. +- Statement 26: The cabbage is in the green_bucket. 
+- Statement 38: William privately told Carter that the cabbage is in the green_crate. + +Step 2: Analyze the statements and eliminate the lies. +- Statement 14 and 38 contradict each other. One of them must be a lie. +- Since William privately told Carter, it is more likely that he told the truth to Carter. Therefore, statement 38 is true and statement 14 is a lie. +- Statement 2 and 26 both claim that the cabbage is in the green_bucket. Therefore, it is likely that the cabbage is really in the green_bucket. + +Step 3: Answer the question. +- The correct answer is F. green_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1909e8e07c1f0e9e7dcdf4f0f4e39487159ff629 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. 
+16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Carter really think the cabbage is? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to look for any information that tells us where Carter thinks the cabbage is. According to the story, Charlotte privately told Avery that the cabbage is in the green_bucket, and William privately told Carter that the cabbage is in the green_crate. However, we don't know if Carter trusts William or not. We also know that Carter moved the spinach to the green_treasure_chest, but there is no information about him moving the cabbage. + +Therefore, based on the given information, we cannot determine where Carter really thinks the cabbage is. The answer is not provided in the options given. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7f976806a5660a3c31dfbe91e3aae8547aecd58 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. 
+13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Avery think Carter thinks the cabbage is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: Step 1: Identify the relevant information in the story. +- Avery, Aiden, Carter, William, and Charlotte entered the office and waiting room multiple times. +- The cabbage is in the green_bucket. +- Charlotte privately told Avery that the cabbage is in the green_bucket. +- Carter moved the spinach to the green_treasure_chest and Charlotte moved it to the green_bucket. +- Avery moved the cabbage to the green_crate. +- William privately told Carter that the cabbage is in the green_crate. + +Step 2: Determine Avery's thoughts about Carter's thoughts. +- Avery was in the office with Carter and Charlotte when the spinach was moved. +- Avery was also in the office with William when the cabbage's location was discussed. +- Avery moved the cabbage to the green_crate after William privately told Carter that it was there. +- There is no information about Avery's thoughts on where Carter thinks the cabbage is. + +Step 3: Answer the question. +- Based on the information given, we cannot determine where Avery thinks Carter thinks the cabbage is. +- Therefore, the answer is not provided in the multiple-choice options. +- The correct answer is not listed. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..923a11f55a5fafc99e5fa151367edf3be79770fe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1,55 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. 
+29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Aiden think Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Aiden, Avery, and Carter regarding the cabbage. According to the story, Avery never made any movements in the office except for the time when he moved the cabbage to the green_crate. Carter moved the spinach from the green_crate to the green_treasure_chest and then Charlotte moved it to the green_bucket. 
Aiden made no movements in the office except for the time when he publicly claimed that the cabbage is in the green_basket. + +We need to find out where Aiden thinks Avery thinks Carter thinks the cabbage is. Since Aiden made no movements in the office when Avery moved the cabbage to the green_crate, he cannot know where the cabbage is. However, he knows that William privately told Carter that the cabbage is in the green_crate. Therefore, Aiden can infer that Carter thinks the cabbage is in the green_crate. + +Now we need to find out where Avery thinks Carter thinks the cabbage is. Since Avery moved the cabbage to the green_crate, he knows that the cabbage is in the green_crate. Therefore, he cannot think that the cabbage is in any other place. + +Finally, we need to find out where Aiden thinks Avery thinks Carter thinks the cabbage is. Since Avery knows that the cabbage is in the green_crate, he cannot think that the cabbage is in any other place. Therefore, Aiden cannot think that Avery thinks that the cabbage is in any other place. + +Therefore, the answer is G. green_crate. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e007877dfd1e7ddc85247046fc290f829996232a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. 
+7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does William think Aiden thinks Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. 
green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: Step 1: Identify the agents involved in the question - William, Aiden, Avery, and Carter. +Step 2: Determine the order of their exits from the office - Avery, Aiden, Carter, William. +Step 3: Determine the location of the cabbage - in the green_crate. +Step 4: Determine who knows the location of the cabbage - Charlotte privately told Avery that the cabbage is in the green_bucket, and William privately told Carter that the cabbage is in the green_crate. +Step 5: Determine who trusts whom - William trusts Carter more than Avery, as Carter exited the office after William. + +Based on the assumptions and the story, we can conclude that William thinks that Aiden thinks Avery thinks that the cabbage is in the green_basket. This is because Aiden publicly claimed that the cabbage is in the green_basket, and William trusts Carter more than Avery, so he would believe that Carter knows the true location of the cabbage. Avery made no movements in the office and did not have any private or public interactions that would suggest he knows the location of the cabbage. Therefore, William would not think that Avery knows the location of the cabbage. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c612a5e158a1a4efe6017cf7cb254d17ae8b2c22 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. 
+31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where is the cherry really? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to follow the movements of the cherry and the agents. Here is a step-by-step breakdown: + +1. The cherry is initially in the cellar. +2. Logan moves the cherry to the green_bucket. +3. Amelia moves the cherry to the green_pantry. +4. Logan privately tells Amelia that the cherry is in the blue_container. +5. Therefore, the cherry is actually in the blue_container. + +The answer is L. blue_container. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8137b64705e0521fe6dbffc93b4c0d3048a85e39 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. 
+31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does William really think the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: To answer this question, we need to track William's movements and interactions with other agents. According to the story, William entered the cellar and made no movements, then exited the cellar. Later, in the waiting room, he publicly claimed that the cherry is in the blue_container. However, Amelia privately told him that the cherry is in the green_pantry, and he later entered the cellar again with Logan and Amelia. The cherry was found in the green_basket, and Ava publicly claimed that it is in the green_basket. 
Logan privately told Amelia that the cherry is in the blue_container. + +Based on these events, we can infer that William is lying about his belief that the cherry is in the blue_container. He was told by Amelia that it is in the green_pantry, and he entered the cellar again with Logan and Amelia, where they found the cherry in the green_basket. Therefore, the correct answer is N. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ad5dab24f3783feb0bae04c844e581395ad80e4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. 
+23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Ava think William thinks the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: The question is asking about Ava's thoughts regarding William's thoughts on the location of the cherry. 
To answer this question, we need to track William's movements and interactions with other agents. + +According to the story, William entered the cellar and made no movements for 1 minute before exiting. He then publicly claimed that the cherry is in the blue_container. Later, Amelia privately told William that the cherry is in the green_pantry. William then entered the cellar again with Logan and Amelia, and the cherry was found in the green_bucket. Logan privately told Amelia that the cherry is in the blue_container. + +Based on this information, we can infer that William initially thought the cherry was in the blue_container, but after Amelia's private communication, he knew that it was actually in the green_pantry. Ava was not present during William's private conversation with Amelia, so she would not know that William's belief had changed. Therefore, Ava would think that William still believes the cherry is in the blue_container. + +The answer is B. blue_bathtub. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..511e4acf7f704019225babc01bb38027c0087bd1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. 
+11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Logan think Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: This question requires a bit of deduction and inference. We need to figure out where Logan thinks Ava thinks William thinks the cherry is. + +First, we know that William publicly claimed that the cherry is in the blue_container, but Amelia privately told William that the cherry is in the green_pantry. This means that William knows the true location of the cherry, but he may or may not be lying about it. + +Next, we need to figure out where Ava thinks the cherry is. We know that Ava dislikes the beans and moved the cherry to the green_bucket. However, we don't know if she knows the true location of the cherry or if she's lying about it. + +Finally, we need to figure out where Logan thinks Ava thinks William thinks the cherry is. We know that Logan privately told Amelia that the cherry is in the blue_container, so he knows the true location of the cherry. However, we don't know if he trusts William's public claim or if he thinks William is lying. + +Based on these assumptions, we can eliminate some options. We know that the cherry is not in the blue_bathtub, red_pantry, red_crate, red_basket, blue_treasure_chest, blue_cupboard, red_bottle, red_bucket, or green_envelope. These locations are either never mentioned in the story or are contradicted by the events that take place. + +We also know that the cherry ends up in the green_basket, but we don't know if Ava knows this or if she's lying about it. 
Therefore, we can't say for sure that Logan thinks Ava thinks the cherry is in the green_basket. + +However, we do know that Logan moved the cherry to the green_pantry and privately told Amelia that the cherry is in the blue_container. This means that he trusts his own knowledge of the cherry's location over William's public claim. Therefore, it's likely that he thinks Ava also knows the true location of the cherry and is not lying about it. + +The only option that fits this criteria is K. green_pantry. Therefore, the answer is K. green_pantry. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..19f6295ccaf930498efa0b33ac6aa0d67c531d52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1,74 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. 
+19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_container +GPT-4 Explain: This question requires a bit of unraveling, but we can break it down step by step. + +1. Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? + +2. Let's start with William's claim in step 16: "The cherry is in the blue_container." + +3. However, in step 17, Amelia privately tells William that the cherry is actually in the green_pantry. + +4. Logan, Amelia, and William then enter the cellar in step 18, and find that the cherry is indeed in the green_bucket (step 19). + +5. Logan then moves the cherry to the green_pantry (step 20), and Amelia moves it to the green_basket (step 22). + +6. In step 38, Ava publicly claims that the cherry is in the green_basket. + +7. However, in step 39, Logan privately tells Amelia that the cherry is actually in the blue_container. + +8. So, where does Amelia think Logan thinks Ava thinks William thinks the cherry is? + +9. We know that William publicly claimed the cherry is in the blue_container, but Amelia knows that it's actually in the green_pantry. + +10. Logan privately tells Amelia that the cherry is in the blue_container, so she knows that Logan knows the true location of the cherry. + +11. However, Ava publicly claims that the cherry is in the green_basket, so Amelia may think that Ava believes the cherry is there. + +12. Therefore, Amelia may think that Logan thinks Ava thinks William thinks the cherry is in the green_basket (option N). + +So the answer is N. green_basket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..971d074a15f32ba9bdcd89ddbf32524c15ebdc48 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. 
+Question: Where is the melon really? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To determine where the melon really is, we need to track its movements based on the given story and assumptions. Here are the steps: + +1. Ella moved the melon to the blue_bottle. +2. Owen moved the melon to the green_envelope. +3. Isla privately told Ella that the melon is in the green_treasure_chest. +4. Owen privately told Aiden that the melon is in the blue_suitcase. +5. Aiden moved the melon to the blue_suitcase. + +Based on these steps, we can conclude that the melon is in the blue_suitcase. Therefore, the answer is D. blue_suitcase. 
+ +a: \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cdde0792c8bf6fdd2afbd3da21a92959d33794e3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1,66 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. 
+32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Aiden really think the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: Step 1: Look for any information related to Aiden's thoughts on the location of the melon. + +Step 2: According to the story, Owen privately told Aiden that the melon is in the blue suitcase (line 17). + +Step 3: However, we need to consider the assumption that every agent tends to lie. Therefore, we cannot trust what Aiden told Evelyn in private (line 41). + +Step 4: We also need to consider the assumption that an agent tends to trust an agent that exited the room later than himself. 
According to the story, Aiden exited the back yard before Ella and Owen (line 24). Therefore, Aiden may trust their claims more than his own. + +Step 5: According to Ella's public claim, the banana is in the green basket (line 40). We can assume that this claim is a lie, based on the assumption that every agent tends to lie. + +Step 6: Therefore, we cannot trust any public claims made by the agents. + +Step 7: Based on the available information, the most likely location of the melon is the blue suitcase, as that is what Owen told Aiden in private. However, we cannot be certain of this due to the assumption that every agent tends to lie. + +Step 8: Therefore, the answer is D. blue suitcase, but with the caveat that we cannot be certain of Aiden's actual thoughts on the matter. + +a: 5 6 7 9 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d38bf99366d5f7082c31986c43078b477817ce70 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. 
+15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Owen think Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: Step 1: Identify the agents involved in the question. The question asks about Owen's thoughts about Aiden's thoughts, so we need to focus on Owen and Aiden. + +Step 2: Determine the interactions between Owen and Aiden. According to the story, Owen privately told Aiden that the melon is in the blue_suitcase (step 17). + +Step 3: Determine the movements of Owen and Aiden. After their private interaction, Owen and Aiden both entered the back_yard (step 18), and then Owen moved the lemon to the blue_treasure_chest (step 20) before exiting the back_yard (step 21). Aiden then moved the lemon to the blue_suitcase (step 23) before exiting the back_yard (step 24). + +Step 4: Determine the exit order of Owen and Aiden. Aiden exited the back_yard after Owen (step 24), so Owen would tend to trust Aiden's thoughts. + +Step 5: Determine where Aiden thinks the melon is. According to Aiden's private communication with Evelyn (step 41), he told her that the banana is in the green_cupboard. + +Step 6: Determine where Owen thinks Aiden thinks the melon is. Since Owen would tend to trust Aiden's thoughts and Aiden thinks the banana is in the green_cupboard, Owen would think that Aiden thinks the melon is in the green_cupboard. + +Answer: N. green_cupboard. 
+ +a: 5 6 7 9 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4d676dcaf4b48523b3ab87ecd4ce0410674d42a5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. 
+32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Ella think Owen thinks Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: To answer this question, we need to trace the movements of Ella, Owen, and Aiden regarding the melon. According to the story, Ella initially moved the melon to the blue_bottle and then exited the back_yard. Owen later moved the melon to the green_envelope and then exited the back_yard. Finally, Aiden moved the melon to the blue_suitcase before exiting the back_yard. + +Now, we need to determine where Ella thinks Owen thinks Aiden thinks the melon is. 
Since Ella moved the melon to the blue_bottle and then left the back_yard, she may not know where Owen moved the melon. However, we know that Owen told Aiden that the melon is in the blue_suitcase. Therefore, Ella may think that Owen thinks Aiden thinks the melon is in the blue_suitcase. + +So, the answer is D. blue_suitcase. + +a: 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b60c4fb59486b5293f27d152cf093883dd2442c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. 
+25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Evelyn think Ella thinks Owen thinks Aiden thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: To answer this question, we need to trace the path of the melon and who knows where it is. 
According to the story, Ella moved the melon to the blue bottle, then Owen moved it to the green envelope, and finally, Aiden moved it to the blue suitcase. However, Owen privately told Aiden that the melon is in the blue suitcase. Therefore, Owen knows that the melon is in the blue suitcase, but he dislikes pears, not melons. + +Now, we need to find out where Aiden thinks the melon is. Since Owen told Aiden that the melon is in the blue suitcase, Aiden knows that the melon is in the blue suitcase. + +Next, we need to find out where Owen thinks Aiden thinks the melon is. Since Owen knows that the melon is in the blue suitcase, he thinks that Aiden also knows that the melon is in the blue suitcase. + +Finally, we need to find out where Evelyn thinks Ella thinks Owen thinks Aiden thinks the melon is. Since Aiden privately told Evelyn that the banana is in the green cupboard, we can assume that Evelyn trusts Aiden's word. Therefore, she thinks that Aiden knows that the melon is in the blue suitcase. Since Owen dislikes pears, not melons, we can assume that he did not tell anyone else where the melon is. Therefore, Evelyn thinks that Ella thinks Owen thinks Aiden thinks the melon is in the blue suitcase. + +Therefore, the answer is D. blue suitcase. + +a: 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0a07e47065a186edf20f8e6e2b0eead2a683ff8c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1,66 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. 
+4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where is the turnip really? +Answer: red_envelope +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. 
green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To determine where the turnip really is, we need to follow the movements of each agent and their private and public interactions. + +- Carter, Mila, Owen, Avery, and Isla entered the sunroom. +- The turnip is in the green_pantry. +- Carter made no movements and stayed in the sunroom for 1 minute. +- Carter exited the sunroom. +- Mila made no movements and stayed in the sunroom for 1 minute. +- Mila exited the sunroom. +- Owen moved the turnip to the blue_cupboard. +- Owen exited the sunroom. +- Avery moved the turnip to the red_envelope. +- Avery exited the sunroom. +- Isla made no movements and stayed in the sunroom for 1 minute. +- Isla exited the sunroom. +- Carter, Mila, Owen, Avery, and Isla entered the waiting_room. +- Avery publicly claimed that the turnip is in the blue_pantry. +- Isla privately told Carter that the turnip is in the red_envelope. + +Based on Isla's private information, we know that the turnip is actually in the red_envelope. Therefore, the answer is (I) red_envelope. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..24722ef0a403f56d291c59a4875e73ffd1dcda8c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. 
+31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Owen really think the turnip is? +Answer: blue_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: To determine where Owen really thinks the turnip is, we need to track the movements of the turnip and the interactions between Owen and the other agents. + +According to the story, the turnip starts in the green_pantry and is moved by Owen to the blue_cupboard. Avery then moves the turnip to the red_envelope. + +In the waiting_room, Avery publicly claims that the turnip is in the blue_pantry, but this claim may not reflect her actual thoughts. Isla privately tells Carter that the turnip is in the red_envelope, but we don't know if Owen overhears this conversation. 
+ +There is no further mention of the turnip in the story, so we cannot definitively determine where Owen thinks the turnip is. + +Therefore, the answer is not provided in the given options. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..979a63d9d15bc90f105ae561971825f3d3eef88f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. 
+27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Mila think Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of Mila and Owen with respect to the turnip. Mila entered the sunroom with Carter, Owen, Avery, and Isla. She stayed there for a minute and then exited. Owen moved the turnip from the green_pantry to the blue_cupboard and then exited the sunroom. 
Avery moved the turnip from the blue_cupboard to the red_envelope and then exited the sunroom. Isla privately told Carter that the turnip is in the red_envelope. + +We don't have any information about Mila's thoughts or interactions with Owen regarding the turnip. However, we know that Mila was in the sunroom before Owen moved the turnip to the blue_cupboard and Avery moved it to the red_envelope. Therefore, Mila must have seen the turnip in the green_pantry before it was moved. + +Since Mila made no movements and stayed in the sunroom for a minute, she had enough time to observe Owen's movements and infer where he thinks the turnip is. We know that Owen moved the turnip to the blue_cupboard, but we don't know if he saw Avery move it to the red_envelope. Therefore, Mila could think that Owen still thinks the turnip is in the blue_cupboard. + +The answer is option J. Mila thinks Owen thinks the turnip is in the blue_cupboard. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4a989739f9dd4a31226d50dceab6456b44f47e3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. 
+12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Carter think Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the agents and their private and public interactions. + +- Carter and Mila entered the sunroom together, but Mila exited after staying for a minute. +- Owen moved the turnip from the green_pantry to the blue_cupboard, and Avery moved it to the red_envelope. +- Isla privately told Carter that the turnip is in the red_envelope. +- Carter, Mila, Owen, Avery, and Isla entered the waiting_room together. +- Avery publicly claimed that the turnip is in the blue_pantry. + +Based on these movements and interactions, we can infer that Carter knows the turnip is in the red_envelope (since Isla told him so), but he also knows that Avery claimed it's in the blue_pantry. Mila didn't make any movements or interactions related to the turnip, so we can eliminate any options that involve her. + +Owen moved the turnip to the blue_cupboard, but we don't know if he made any public or private claims about its location. However, we do know that Avery privately told Owen that the grapes are in the red_basket. Since Avery tends to lie, we can't trust her claim about the grapes' location, but we can assume that Owen might believe her and think the grapes are in the red_basket. + +Therefore, Carter might think that Mila thinks Owen thinks the turnip is in the D. red_bottle (since that's where Avery moved the turnip to and Owen might believe Avery's claim about the grapes' location). + +The answer is D. red_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b1767c8a6de9ca874a12595807095bd7f042e4f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. 
+31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Isla think Carter thinks Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: To solve this question, we need to track the movements of the agents and their private and public interactions. According to the story, Carter and Mila entered the sunroom first, followed by Owen, Avery, and Isla. Carter and Mila made no movements and exited the sunroom before Owen moved the turnip to the blue_cupboard and Avery moved it to the red_envelope. Isla made no movements and exited the sunroom last. 
+ +In the waiting room, Avery publicly claimed that the turnip is in the blue_pantry, but Isla privately told Carter that the turnip is in the red_envelope. This means that Isla knows the actual location of the turnip, but Carter may or may not know it. + +Later, Isla, Avery, and Carter entered the back yard, where Isla made no movements and exited first, followed by Avery who also made no movements. Carter then moved the persimmon to the red_box before exiting. + +In the waiting room again, Carter publicly claimed that grapes are in the blue_bucket, but Avery privately told Owen that the grapes are in the red_basket. This means that Avery knows the actual location of the grapes, but Carter may or may not know it. + +Based on these movements and interactions, we can conclude that Isla thinks that Carter thinks that Mila thinks that Owen thinks the turnip is in the red_envelope. Therefore, the answer is D. red_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c002b9567fad31ccb8b30358e5d7e312cec67c3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. 
+13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where is the spinach really? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To determine where the spinach really is, we need to follow the movements of each agent and their private and public interactions. + +- Jackson moved the spinach from the red_container to the green_crate, but then moved it back to the red_drawer after Ella privately told him that the spinach is in the red_crate. +- Jack then moved the spinach from the red_drawer to the blue_drawer. +- Ella then moved the spinach from the blue_drawer to the red_drawer. + +Therefore, the spinach is in the red_drawer. The answer is M. red_drawer. + +a: 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c0062c7fd4da798fdb6b133959d6e918db2c0299 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1,67 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. 
+14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jacob really think the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to trace Jacob's movements and interactions with other agents. + +- Jacob entered the laundry with Jackson and Ella (step 17). +- The spinach was in the red_drawer (step 18). +- Jackson moved the spinach to the green_crate (step 19). +- Jacob made no movements and stayed in the laundry for 1 minute (step 21). +- Jacob exited the laundry (step 22). +- Jacob likes the red_pantry (step 28). +- Jacob, along with Amelia, Ella, and Jack, entered the patio (step 29). +- The tomato was in the green_drawer (step 30). +- Amelia moved the tomato to the green_bottle (step 31). +- Jacob made no movements and stayed in the patio for 1 minute (step 33). +- Jacob exited the patio (step 34). +- Jacob, along with Amelia, Ella, and Jack, entered the waiting_room (step 39). + +Based on these steps, we can see that Jacob never interacted with the spinach after it was moved to the green_crate by Jackson. Therefore, he would not know where the spinach is currently located. None of the options given match this answer, so the correct answer would be "Unknown." + +a: 5 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfc1fa6e67bd38b5a80a3794fd7d8085a50e6fe4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jackson think Jacob thinks the spinach is? +Answer: green_crate +Choices: A. 
green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to track the movements of Jackson and Jacob and their interactions with other agents. + +1. Jackson moved the spinach from the red_container to the green_crate (step 4) and then moved it back to the red_drawer (step 19). +2. Jacob made no movements in the laundry (step 10) and stayed in the laundry for 1 minute (step 11). +3. Jackson, Jacob, and Ella entered the laundry again and found the spinach in the red_drawer (step 18). + +Based on these movements, we can infer that Jackson thinks Jacob thinks the spinach is in the red_drawer (option M). + +a: 5 6 7 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..66335875c63f219b3201c708245709a3708868a4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. 
+Question: Where does Jack think Jackson thinks Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: To answer this question, we need to trace the movements of Jackson, Jack, and Jacob regarding the spinach. + +First, Jackson moved the spinach from the red_container to the green_crate. Then, Jack moved the spinach from the green_crate to the blue_drawer. Finally, Ella moved the spinach from the blue_drawer to the red_drawer. + +Later, Ella privately told Jackson that the spinach is in the red_crate, but this information is not relevant to Jack's thoughts. + +Then, Jackson, Jacob, and Ella entered the laundry again and found the spinach in the red_drawer. Jackson moved the spinach from the red_drawer to the green_crate. + +Based on the assumption that an agent tends to trust another agent who exited the room later than himself, Jack would trust Jackson's movements more than Jacob's movements. + +Therefore, Jack would think that Jackson thinks the spinach is in the green_crate (option O). + +The answer is O. green_crate. 
+ +a: 1 5 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..708974848435a8e7351c13f1bfb6bba29a79d5c4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. 
+33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Ella think Jack thinks Jackson thinks Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: This is a complex question that requires careful analysis. Let's break it down step by step: + +1. Ella privately told Jackson that the spinach is in the red_crate. +2. Jack privately told Jacob that the spinach is in the red_drawer. +3. Jackson moved the spinach to the green_crate. +4. Ella moved the spinach to the red_drawer. + +Based on these actions, we can infer that Ella knows the true location of the spinach (in the red_drawer) and that Jack knows that Jackson thinks the spinach is in the red_drawer. 
However, we don't know where Ella thinks Jack thinks Jackson thinks the spinach is. + +To answer the question, we need to look for clues about Ella's thought process. We know that she moved the spinach to the red_drawer after Jackson moved it to the green_crate, which suggests that she trusts her own knowledge over Jackson's actions. We also know that she didn't have any private or public interactions with Jack or Jacob after they left the laundry, so she doesn't have any new information about their thoughts. + +Therefore, the most likely answer is that Ella still thinks Jack thinks Jackson thinks the spinach is in the red_drawer, since that was the last location Jack mentioned to Jacob and Ella knows that the spinach is actually in the red_drawer. The answer is M. red_drawer. + +a: 5 6 1 2 \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7e8c0e3453bb3ca7a4d56572f84a84b7136fb48 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. 
+16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the corn and the statements made by the agents. According to the story, Nathan moved the corn to the red_envelope, then Lily moved it to the green_envelope, then Amelia moved it to the green_drawer, then Alexander moved it to the green_box, and finally Abigail moved it back to the green_bottle. In the waiting_room, Amelia publicly claimed that the corn is in the green_bottle, but Abigail privately told her that it is in the green_envelope. Since Abigail moved the corn to the green_bottle after moving it to the green_envelope, we can assume that she is lying to Amelia in the private conversation. Therefore, the corn is actually in the green_bottle. The answer is F. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8962bafb8b96064d2be6961b85e61f39db42978f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. 
+14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Amelia really think the corn is? +Answer: green_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to track Amelia's movements and interactions with other agents. According to the story, Amelia moved the corn to the green_drawer and publicly claimed that the corn is in the green_bottle. However, Abigail privately told Amelia that the corn is in the green_envelope. We know that Amelia tends to lie, so we cannot trust her public claim. We also know that Amelia trusts Abigail because Abigail exited the hallway after Amelia. Therefore, we can infer that Amelia really thinks the corn is in the green_envelope, which is option G. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..108c1a34c7da1cb95c0b2aa3e2d25c79de23cade --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. 
+14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Nathan think Amelia thinks the corn is? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of the corn and the interactions between Nathan and Amelia. According to the story, Nathan moved the corn to the red_envelope, and Abigail privately told Amelia that the corn is in the green_envelope. However, Amelia publicly claimed that the corn is in the green_bottle. This means that Amelia is lying about the location of the corn. + +Since Nathan exited the hallway before Amelia made her claim, he would not have heard her public claim. However, Abigail privately told Amelia that the corn is in the green_envelope, and Nathan and Amelia were both in the lounge together with Abigail. Therefore, Nathan could have overheard their private conversation and knows that Amelia actually thinks the corn is in the green_envelope. + +Therefore, the answer is G. green_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ad00fe0a708132f67ea190c53e25334a2f9688 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1,51 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. 
+7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Lily think Nathan thinks Amelia thinks the corn is? +Answer: red_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: To answer this question, we need to track the movements of the corn and the agents' interactions. Nathan moved the corn from the green_bottle to the red_envelope, and Abigail privately told Amelia that the corn is in the green_envelope. Lily moved the corn from the green_envelope to the green_drawer, and Alexander moved it to the green_box before Abigail moved it back to the green_bottle. In the waiting room, Amelia publicly claimed that the corn is in the green_bottle, but Abigail privately told her that it's in the green_envelope. + +Based on this information, we can infer that Lily thinks Nathan thinks Amelia thinks the corn is in the green_envelope. Lily moved the corn from the green_envelope to the green_drawer after Nathan moved it to the red_envelope, so she knows that Nathan didn't leave the corn in the green_envelope. Abigail privately told Amelia that the corn is in the green_envelope, so Amelia may think that the corn is there. Nathan exited the hallway before Abigail moved the corn back to the green_bottle, so he may not know where the corn ended up. Therefore, Lily thinks Nathan thinks Amelia thinks the corn is in the green_envelope. + +The answer is G. green_envelope. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..17920b7dc362392421fdaaae255d01b9914eec0c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. 
+32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Alexander think Lily thinks Nathan thinks Amelia thinks the corn is? +Answer: red_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: This is a complex question that requires careful analysis. We need to trace the movements of the corn and the agents to determine where Alexander thinks Lily thinks Nathan thinks Amelia thinks the corn is. + +Step 1: Start with the last piece of information we have about the corn. Amelia privately told Nathan that the corn is in the green_cupboard. + +Step 2: Trace back to where Nathan was when he received this information. Nathan was in the waiting_room with Abigail and Amelia. + +Step 3: Trace back to where Amelia was before she told Nathan about the corn. 
She was in the bedroom with Alexander, Lily, and Nathan. + +Step 4: Trace back to where Lily was before Amelia left the bedroom. She had moved the green_pepper to the red_container. + +Step 5: Trace back to where Nathan was before Lily moved the green_pepper. He had exited the bedroom. + +Step 6: Trace back to where Alexander was before Nathan left the bedroom. He had made no movements and stayed in the bedroom for 1 minute. + +Step 7: Therefore, Alexander thinks Lily thinks Nathan thinks Amelia thinks the corn is in the red_container. + +The answer is B. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..43f97f1747b861ed667eaa66b49d16d3fd9b0f9c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1,62 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. 
+18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where is the sweet_potato really? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: Step 1: Look for all the movements related to the sweet_potato. +- Sophia moved the sweet_potato to the green_bottle. +- Hannah moved the sweet_potato to the green_box. +- Jackson moved the sweet_potato to the red_box. +Step 2: Look for any public or private claims related to the sweet_potato. +- Hannah publicly claimed that sweet_potato is in the green_bottle. +- Jackson privately told Sophia that the sweet_potato is in the red_box. +Step 3: Determine which claim is true based on the assumptions. +- Hannah tends to lie, so her claim may not be true. +- Jackson may be lying or telling the truth, but he is not a reliable source since he had a private conversation with Sophia. +- Sophia's movements were before Hannah and Jackson's movements, so she exited the front_yard later than both of them. Therefore, she is a more reliable source than Hannah or Jackson. +- Sophia moved the sweet_potato to the green_bottle, but Jackson claimed it is in the red_box. Therefore, Jackson is lying and the sweet_potato is actually in the green_bottle. +Step 4: Choose the correct answer. +The sweet_potato is in the N. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..874f525727f8b02ca59a37c9fa3766e98db13cff --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1,59 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. 
+3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Sophia really think the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. 
green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to track Sophia's movements and any private or public interactions she had regarding the sweet_potato. + +1. Sophia entered the front_yard with the sweet_potato in the red_box. +2. Sophia moved the sweet_potato to the green_bottle. +3. Sophia exited the front_yard. +16. Hannah publicly claimed that sweet_potato is in the green_bottle. +17. Jackson privately told Sophia that the sweet_potato is in the red_box. + +Based on the above information, we know that Sophia moved the sweet_potato from the red_box to the green_bottle. However, we also know that Jackson privately told Sophia that the sweet_potato is in the red_box. Since Sophia knows this information, she may be lying about where she thinks the sweet_potato is. + +Therefore, the answer to the question is K. red_box. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6187ebe516ab20e57c7f4c5c3a43fcc17ca786de --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1,65 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. 
+31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Jackson think Sophia thinks the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: To answer this question, we need to track the movements of the sweet_potato and the interactions between Jackson and Sophia. + +Step 1: Sophia moved the sweet_potato from the red_box to the green_bottle. + +Step 2: Sophia exited the front_yard. + +Step 3: Hannah moved the sweet_potato from the green_bottle to the green_box. + +Step 4: Jackson moved the sweet_potato from the green_box to the red_box. + +Step 5: Jackson privately told Sophia that the sweet_potato is in the red_box. 
+ +Based on these steps, we know that Jackson knows the sweet_potato is in the red_box and he told Sophia this information privately. However, we don't know where Jackson thinks Sophia thinks the sweet_potato is. + +To answer the question, we need to look for any information about Jackson's thoughts on Sophia's beliefs about the sweet_potato's location. There is no direct information about this in the story. + +Therefore, the answer is unknown or cannot be determined from the given information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..56ff8bbb650ccae8196c2d768ab34da042f238d8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1,53 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. 
+20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Avery think Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_bottle +GPT-4 Explain: To answer this question, we need to track the movements of Avery, Jackson, and Sophia regarding the sweet_potato. According to the story, Sophia initially moved the sweet_potato from the red_box to the green_bottle, then Hannah moved it to the green_box, and finally, Jackson moved it back to the red_box. Sophia exited the front_yard after moving the sweet_potato to the green_bottle, and Avery made no movements regarding the sweet_potato. + +We also know that Jackson privately told Sophia that the sweet_potato is in the red_box, and Hannah publicly claimed that the sweet_potato is in the green_bottle. + +Since Avery did not witness any of these movements or interactions, we cannot determine where Avery thinks Jackson thinks Sophia thinks the sweet_potato is. Therefore, the answer is not given in the options provided. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2f28910fa049620ac5f8399bac76aef59e346c1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1,74 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. 
+13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Hannah think Avery thinks Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: This is a complex question that requires careful analysis of the story and assumptions. Let's break it down step by step: + +1. Hannah privately told Avery that the peach is in the red_basket. +2. Avery made no movements and stayed in the basement for 1 minute. +3. Avery exited the basement. +4. Hannah, Jackson and Sophia entered the waiting_room. + +Based on assumption (2), we know that Hannah can only infer what Avery thinks if they have been in the same place or had private or public interactions. Since Avery made no movements in the basement and Hannah privately told Avery about the peach, we can assume that they had a private interaction in the basement. + +Next, we need to determine where the peach is currently located. According to step 35, Hannah moved the peach to the red_basket before exiting the basement. However, in step 39, Jackson publicly claimed that the peach is in the red_container. Since we know that every agent tends to lie (assumption 3), we cannot trust Jackson's claim. + +Therefore, we can conclude that the peach is in the red_basket, as Hannah privately told Avery. Now we need to determine where Hannah thinks Avery thinks Jackson thinks Sophia thinks the sweet_potato is. + +According to step 16, Hannah publicly claimed that the sweet_potato is in the green_bottle. However, we cannot trust this claim since every agent tends to lie. 
We need to look for private or public interactions between Hannah, Avery, Jackson, and Sophia to determine where they think the sweet_potato is. + +In step 11, Hannah moved the sweet_potato to the green_box before exiting the front_yard. However, in step 17, Jackson privately told Sophia that the sweet_potato is in the red_box. Since we know that every agent tends to lie, we cannot trust Jackson's claim. + +Therefore, we can conclude that Hannah thinks the sweet_potato is in the green_box, since she moved it there before exiting the front_yard. Now we need to determine where Avery thinks Jackson thinks Sophia thinks the sweet_potato is. + +There are no private or public interactions between Avery, Jackson, and Sophia regarding the sweet_potato, so we need to look for their movements. According to step 8, Avery likes the green_pantry, but we cannot infer anything about the sweet_potato from this information. + +According to step 1, Sophia, Noah, Avery, Hannah, and Jackson entered the front_yard together. In step 3, Sophia moved the sweet_potato to the green_bottle before exiting the front_yard. In step 5, Noah made no movements and stayed in the front_yard for 1 minute. In step 7, Noah exited the front_yard. In step 9, Avery made no movements and stayed in the front_yard for 1 minute. In step 10, Avery exited the front_yard. In step 11, Hannah moved the sweet_potato to the green_box before exiting the front_yard. In step 13, Jackson moved the sweet_potato to the red_box before exiting the front_yard. + +Based on assumption (1), we know that an agent witnesses everything and every movement before exiting a place. Therefore, we can conclude that Avery witnessed Sophia moving the sweet_potato to the green_bottle and Hannah moving the sweet_potato to the green_box before exiting the front_yard. We cannot infer anything about what Jackson thinks since he did not make any movements regarding the sweet_potato. 
+ +Therefore, we can conclude that Hannah thinks Avery thinks Jackson thinks Sophia thinks the sweet_potato is in the green_box (option O). \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7325cb0d351e1ac9bffefbb2ffab922097a7840a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. 
+28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where is the orange really? +Answer: blue_bucket +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: To answer this question, we need to track the movements of the orange and the statements made by the agents. According to the story, the orange was initially in the green_box in the laundry. 
Jacob moved it to the blue_bottle, and then Jackson moved it to the red_container. Isabella later moved it to the blue_bucket in the laundry. Jackson publicly claimed that the orange is in the red_container, but Owen privately told Hannah that the orange is in the red_container. However, Hannah privately told Isabella that the orange is in the blue_bottle. Therefore, based on the story and assumptions, the orange is actually in the blue_bottle. The answer is D. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..43f531dde68ee538a751ee6afc51f818db613887 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. 
+21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Owen really think the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: Step 1: Look for any information related to Owen's thoughts about the orange. +- According to step 17, Owen privately told Hannah that the orange is in the red_container. +- According to step 42, Owen lost his watch. This information is not relevant to the question. + +Step 2: Determine the correct answer based on the information found. +- Owen privately told Hannah that the orange is in the red_container, so Owen really thinks that the orange is in the red_container. +- Therefore, the answer is B. red_container. + +Final answer: B. red_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..62948a9451dcb43cf5b808d830344b20490c1831 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. 
+16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Isabella think Owen thinks the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Isabella and Owen regarding the orange. According to the story, Isabella publicly claimed that the orange is in the blue_bucket, while Owen privately told Hannah that the orange is in the red_container. Isabella later moved the orange to the blue_bucket in the laundry. However, we don't have any information about Owen's thoughts on the location of the orange after he privately told Hannah about it. Therefore, we cannot determine where Isabella thinks Owen thinks the orange is. The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bef53b337d233418499f2d6572e91ac0c7ad2811 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1,63 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. 
+12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Jacob think Isabella thinks Owen thinks the orange is? +Answer: blue_bottle +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: To answer this question, we need to trace the movements of Jacob, Isabella, and Owen regarding the orange. + +1. Jacob moved the orange from the green_box to the blue_bottle. +2. Jackson moved the orange from the blue_bottle to the red_container. +3. Isabella moved the orange from the red_container to the blue_bucket. +4. Owen privately told Hannah that the orange is in the red_container. + +Based on these movements, we know that Jacob last saw the orange in the blue_bottle, but he doesn't know that Jackson moved it to the red_container. Isabella last moved the orange to the blue_bucket, but she doesn't know that Owen told Hannah it's in the red_container. + +Therefore, Jacob thinks Isabella thinks the orange is in the blue_bucket, but in reality, it's in the red_container. + +The answer is C. blue_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d36eacb8b15fd89c38f9ebd9447b5ed6739db050 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1,66 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. 
+43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Hannah think Jacob thinks Isabella thinks Owen thinks the orange is? +Answer: green_box +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To solve this question, we need to track the movements and interactions of Hannah, Jacob, Isabella, and Owen regarding the orange. + +First, Hannah entered the laundry with the group and made no movements before exiting. She then saw a monkey and lost her watch before rejoining the group in the waiting room. + +Jacob moved the orange from the green_box to the blue_bottle before exiting the laundry. + +Jackson saw a dog and moved the orange from the blue_bottle to the red_container before exiting the laundry. + +Isabella made no movements in the laundry but later claimed publicly that the orange is in the blue_bucket. She then lost her watch before rejoining the group in the waiting room. + +Owen made no movements in the laundry but privately told Hannah that the orange is in the red_container. He later lost his watch before rejoining the group in the waiting room. 
+ +In the second visit to the laundry, Isabella moved the orange from the red_container to the blue_bucket before exiting. + +Based on these movements and interactions, we can determine that Hannah thinks Jacob thinks Isabella thinks the orange is in the blue_bucket. Therefore, the answer is C. blue_bucket. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f742150692b2ac983f5711f3b594c1c0ce9dd16 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. 
+26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where is the lime really? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: To determine the location of the lime, we need to track its movements throughout the story. Benjamin initially moved the lime to the green_treasure_chest, but we don't know if it stayed there. Isabella then moved the lime to the blue_crate, but again, we don't know if it stayed there. 
Chloe then moved the lime to the green_envelope, but we still don't know if it stayed there. Finally, Sophia moved the lime back to the green_bottle. Therefore, the lime is really in the green_bottle. The answer is A. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..948228d4ced89de3602efcac12c5aea80bff7b15 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. 
+28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Amelia really think the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to trace Amelia's movements and any private or public interactions she had regarding the lime. According to the story, Amelia did not move the lime at any point. However, in step 15, she publicly claimed that the lime is in the green_bottle. Therefore, the correct answer is A. green_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..35204523985fb6827bd65cec72e0fbcbd8c1d1ad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1,68 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. 
+33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Sophia think Amelia thinks the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: Step 1: Identify the agents involved in the question. The question asks about Sophia's thoughts about Amelia's thoughts, so we need to focus on Sophia and Amelia's movements and interactions. + +Step 2: Trace Sophia and Amelia's movements and interactions. Sophia and Amelia were together with Isabella in the laundry (steps 17-22), and then they all entered the waiting room (step 27). Later, Amelia privately told Chloe that the beans are in the green_pantry (step 41). 
+ +Step 3: Determine where Amelia was when she publicly claimed that the lime is in the green_bottle (step 15). Amelia made this claim in the waiting room, which means she must have moved there after leaving the porch (step 10). + +Step 4: Determine where Sophia was when Amelia made the public claim. Sophia was also in the waiting room at this time (step 27). + +Step 5: Determine where the lime was at the time of Amelia's public claim. According to step 15, Amelia claimed that the lime is in the green_bottle. + +Step 6: Determine where Amelia moved the beans to after Isabella moved them to the blue_bottle (steps 18-20). Amelia moved the beans to the red_box (step 24). + +Step 7: Determine where Sophia moved the beans to after Amelia moved them to the red_box (steps 23-24). Sophia moved the beans to the blue_drawer (steps 33-34). + +Step 8: Determine where Chloe moved the beans to after Sophia moved them to the blue_drawer (steps 35-36). Chloe moved the beans to the blue_bottle. + +Step 9: Determine where Amelia moved the beans to after Chloe moved them to the blue_bottle (steps 37-38). Amelia moved the beans to the green_pantry. + +Step 10: Determine where Sophia thinks Amelia thinks the lime is. Since Amelia publicly claimed that the lime is in the green_bottle and Sophia was present in the waiting room at that time, Sophia knows that Amelia thinks the lime is in the green_bottle. Therefore, the answer is A. green_bottle. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae7bb80e55b4cf94e63ddbde1d577604a5dc3f12 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Chloe think Sophia thinks Amelia thinks the lime is? +Answer: green_envelope +Choices: A. 
green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: To answer this question, we need to trace the movements and interactions of Chloe, Sophia, and Amelia regarding the lime. According to the story, Chloe moved the lime to the green_envelope, Sophia moved it back to the green_bottle, and Amelia publicly claimed that the lime is in the green_bottle. However, we need to determine where Chloe thinks Sophia thinks Amelia thinks the lime is. + +Based on the assumptions given, Chloe can only infer Sophia's thoughts if they have been in the same place or have had private or public interactions. From the story, we know that Chloe and Sophia were both in the porch and the waiting_room together, but there is no mention of them having any private interactions. Therefore, Chloe can only base her inference on Sophia's public claim. + +Sophia publicly claimed that the beans are in the red_box, not the lime. Therefore, Chloe cannot infer where Sophia thinks Amelia thinks the lime is. The answer is not provided in the options given. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c2d64315598bca9a163b8fbe7d33306e181ffa9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1,58 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. 
+33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Isabella think Chloe thinks Sophia thinks Amelia thinks the lime is? +Answer: blue_crate +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: This is a complex question that requires careful analysis. We need to trace the movements of the lime and the interactions between the characters to determine where Isabella thinks Chloe thinks Sophia thinks Amelia thinks the lime is. + +First, we know that Benjamin moved the lime to the green_treasure_chest, but then Isabella moved it to the blue_crate. Chloe then moved it to the green_envelope, and finally Sophia moved it back to the green_bottle. 
This means that the lime ended up in the green_bottle, but each character may have a different belief about where it is. + +Next, we need to consider the public and private claims made by the characters. Amelia publicly claimed that the lime is in the green_bottle, while Sophia privately told Benjamin the same thing. Isabella, Sophia, and Amelia later entered the laundry, where the beans were in the blue_suitcase. Isabella moved the beans to the blue_bottle, and Sophia later moved them to the blue_drawer. Chloe then moved the beans back to the blue_bottle, and finally Amelia moved them to the green_pantry. Sophia publicly claimed that the beans are in the red_box, while Amelia privately told Chloe that they are in the green_pantry. + +Based on this information, we can determine that Isabella thinks Chloe thinks Sophia thinks the lime is in the green_bottle. This is because Isabella knows that the lime ended up in the green_bottle, and she also knows that Sophia privately told Benjamin that the lime is in the green_bottle. Chloe was not present for this private conversation, so she may not know that Sophia believes the lime is in the green_bottle. However, Isabella knows that Chloe moved the lime to the green_envelope, which is a different location. Therefore, Isabella believes that Chloe has a different belief about where the lime is. Sophia and Amelia both publicly claimed that the lime is in the green_bottle, so Isabella believes that Chloe thinks Sophia thinks Amelia thinks the lime is in the green_bottle. + +The answer is A. green_bottle. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4849323372e191cea0e76b3aca6fc540def4f357 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. 
+33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where is the carrot really? +Answer: red_pantry +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: To answer this question, we need to track the movements of the carrot and the statements made by the agents. According to the story, the carrot was initially in the red_pantry, then moved to the red_bucket by Avery, then to the blue_crate by Jack, then to the green_box by Chloe, and finally to the red_pantry by Sophia. Therefore, the correct answer is K. red_pantry. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e2044c08fc131d9714e230420ffd56a609c81c9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. 
+33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Chloe really think the carrot is? +Answer: green_box +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: To answer this question, we need to track Chloe's movements and interactions with other agents related to the carrot. According to the story, Chloe moved the carrot to the green_box and then exited the garage. There is no mention of Chloe having any private or public interactions related to the carrot after that. Therefore, Chloe really thinks the carrot is in the green_box, which is option N. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa4820f91a773e9740581bd0ee2a5c5bc8308eee --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1,56 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. 
+33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Amelia think Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: To answer this question, we need to track the movements of Amelia and Chloe and their interactions with the carrot. According to the story, Chloe moved the carrot to the green_box, which means she knows the carrot's location. Amelia, on the other hand, did not move the carrot and lost his phone while in the garage. + +There is no direct interaction between Amelia and Chloe regarding the carrot's location. 
However, we know that Sophia privately told Jack that the carrot is in the green_box. Since Chloe was in the same place as Sophia, she could have overheard the conversation and know the carrot's location. + +Therefore, Amelia might think that Chloe thinks the carrot is in the green_box. The answer is N. green_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae6c99ab784119222ebf9bcdbb8fbd2404247927 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1,64 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. 
+26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Avery think Amelia thinks Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_bucket +GPT-4 Explain: This is a complex question that requires careful analysis of the story and the assumptions given. To break it down, we need to identify the agents involved and their movements and interactions related to the carrot. + +First, we know that Avery moved the carrot from the red_pantry to the red_bucket, and Sophia later moved it back to the red_pantry. Jack then moved the carrot to the blue_crate. Chloe then moved the carrot to the green_box. We also know that Avery dislikes cherries and likes the red_pantry. + +Next, we need to consider the interactions between Amelia, Chloe, and Avery related to the carrot. We know that Amelia lost his phone and made no movements in the garage or closet related to the carrot. Chloe made no movements in the closet related to the carrot, but did move the carrot to the green_box in the garage. Sophia privately told Jack that the carrot is in the green_box, but we don't know if Amelia or Chloe overheard this conversation. + +Based on these movements and interactions, we can eliminate several answer choices. We know that the carrot is not in the blue_pantry or the red_box, as these locations are not mentioned in the story. We also know that the carrot is not in the green_envelope, as this location is not mentioned and no agent has claimed that the carrot is there. + +To determine where Avery thinks Amelia thinks Chloe thinks the carrot is, we need to consider Avery's knowledge of the carrot's location and his interactions with Amelia and Chloe. We know that Avery moved the carrot to the red_bucket and later exited the garage. Amelia made no movements related to the carrot and later exited the garage after Avery. Chloe moved the carrot to the green_box and later exited the garage after Sophia. + +Based on the assumption that agents tend to trust those who exit a room later than themselves, Avery may trust Sophia's claim that the carrot is in the green_box. 
However, we don't know if Avery heard this claim or if he trusts Sophia. We also don't know if Avery has any reason to believe that Amelia or Chloe have a different opinion on the carrot's location. + +Given these uncertainties, it's difficult to determine where Avery thinks Amelia thinks Chloe thinks the carrot is. However, based on Avery's movements and preferences, it's possible that he thinks Chloe thinks the carrot is in the green_box, as this is where Chloe moved the carrot and Avery likes the red_pantry, which is not a viable answer choice. Therefore, the best answer choice is N. green_box. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c682b3f55890bb2fe9e29aa8149dcdf24f1610b3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1,78 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. 
+21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Sophia think Avery thinks Amelia thinks Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: This is a complex question that requires careful analysis. We need to trace the path of the carrot and the movements of the agents to determine where Sophia thinks Avery thinks Amelia thinks Chloe thinks the carrot is. + +According to the story, the carrot starts in the red_pantry, is moved to the red_bucket by Avery, then to the blue_crate by Jack, and finally to the green_box by Chloe. + +Sophia privately tells Jack that the carrot is in the green_box, but we need to determine where Sophia thinks Avery thinks Amelia thinks Chloe thinks the carrot is. + +We know that Avery dislikes the cherry and likes the red_pantry, but we don't have any information about what Avery thinks about the carrot. + +Amelia loses his phone and makes no movements in the garage or closet, so we can eliminate him from consideration. + +Chloe makes no movements in the closet for one minute, but we don't have any information about what she thinks about the carrot. + +Therefore, we need to focus on Sophia's interactions with Avery and Jack. + +Sophia privately tells Jack that the carrot is in the green_box, but we don't know if Jack trusts Sophia or not. + +Sophia publicly claims that the watermelon is in the red_envelope, but we don't know if she is lying or not. + +Avery exits the garage before Sophia, so she may not trust him as much as Jack. + +Based on this analysis, we can eliminate options A, B, C, D, E, F, G, H, I, J, and O. + +The only options left are K (red_pantry) and M (red_bucket). + +Since we know that Avery likes the red_pantry, Sophia may think that Avery thinks the carrot is in the red_pantry. + +Therefore, the answer is K (red_pantry). 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c523160056f0742332ee9aa94911db19247b0631 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1,80 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. 
+31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements of the watermelon and the statements made by the agents. + +1. Nathan, Elizabeth, Carter, Jacob, and Isla entered the kitchen. +2. The watermelon is in the blue_bottle. +3. Nathan made no movements and stayed in the kitchen for 1 minute. +4. Nathan exited the kitchen. +5. Elizabeth moved the watermelon to the red_envelope. +6. Elizabeth exited the kitchen. +7. Carter moved the watermelon to the blue_cupboard. +8. Carter exited the kitchen. +9. 
Jacob made no movements and stayed in the kitchen for 1 minute. +10. Jacob exited the kitchen. +11. Isla made no movements and stayed in the kitchen for 1 minute. +12. Carter dislikes the cherry. +13. Isla exited the kitchen. +14. Nathan, Elizabeth, Carter, Jacob, and Isla entered the waiting_room. +15. Carter publicly claimed that watermelon is in the red_envelope. +16. Isla privately told Carter that the watermelon is in the blue_container. +17. Jacob, Carter, and Elizabeth entered the kitchen. +18. The watermelon is in the blue_cupboard. +19. Jacob moved the watermelon to the red_envelope. +20. Jacob exited the kitchen. +21. Carter moved the watermelon to the green_bucket. +22. Carter exited the kitchen. +23. Elizabeth moved the watermelon to the blue_container. +24. Elizabeth exited the kitchen. +25. Jacob, Carter, and Elizabeth entered the waiting_room. + +Based on the movements and statements, we can see that the watermelon was initially in the blue_bottle, then moved to the red_envelope by Elizabeth, then to the blue_cupboard by Carter, and finally to the blue_container by Elizabeth. + +Carter publicly claimed that the watermelon is in the red_envelope, but Isla privately told him that it is in the blue_container. Jacob then moved the watermelon from the blue_cupboard to the red_envelope, and Carter moved it to the green_bucket before Elizabeth moved it to the blue_container. + +Therefore, the correct answer is I. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4711b6e7637801f8825ac470fceaacab04e84c21 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. 
+Question: Where does Isla really think the watermelon is? +Answer: blue_cupboard +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: To answer this question, we need to track Isla's movements and interactions with other agents. According to the story, Isla made no movements in the kitchen and stayed there for one minute before exiting. Later, in the waiting room, Isla privately told Carter that the watermelon is in the blue_container. However, we cannot assume that Isla is telling the truth, as all agents tend to lie. Therefore, we need to look for further evidence. + +When Jacob, Carter, and Elizabeth entered the kitchen, they found the watermelon in the blue_cupboard. Jacob moved the watermelon to the red_envelope before exiting, and Carter moved it to the green_bucket before exiting. Elizabeth then moved the watermelon to the blue_container before exiting. + +Based on this information, we can infer that Isla's private claim to Carter that the watermelon is in the blue_container is likely false, as the watermelon was not in the blue_container when Jacob, Carter, and Elizabeth entered the kitchen. 
Therefore, Isla's actual thought about the watermelon's location is unknown. + +The answer is not provided in the options given, as Isla's actual thought about the watermelon's location cannot be determined based on the given information. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a9ad39a1c51e5033501734463382a08d6351f98 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. 
+25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Carter think Isla thinks the watermelon is? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: To answer this question, we need to track the movements and interactions of Carter and Isla regarding the watermelon. 
According to the story, Carter publicly claimed that the watermelon is in the red_envelope, but Isla privately told Carter that the watermelon is in the blue_container. Later, Jacob moved the watermelon to the red_envelope, and then Carter moved it to the green_bucket. Therefore, Carter knows that the watermelon was not in the red_envelope when he made his public claim, and he also knows that Isla's private information was correct. Based on this information, we can conclude that Carter thinks Isla thinks the watermelon is in the blue_container (option I). Therefore, the answer is I. blue_container. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d09c18f3267d58920b29e0c08fdd1c0f62dc08bf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1,108 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. 
+17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Elizabeth think Carter thinks Isla thinks the watermelon is? +Answer: red_envelope +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: The question is asking for Elizabeth's thoughts about Carter's thoughts about Isla's thoughts on the location of the watermelon. To solve this, we need to track the movements of the watermelon and the interactions between the characters. + +1. Nathan, Elizabeth, Carter, Jacob, and Isla entered the kitchen. +2. The watermelon is in the blue_bottle. +3. Nathan made no movements and stayed in the kitchen for 1 minute. +4. Nathan exited the kitchen. +5. Elizabeth moved the watermelon to the red_envelope. +6. Elizabeth exited the kitchen. +7. Carter moved the watermelon to the blue_cupboard. +8. Carter exited the kitchen. +9. Jacob made no movements and stayed in the kitchen for 1 minute. +10. Jacob exited the kitchen. +11. Isla made no movements and stayed in the kitchen for 1 minute. +12. Carter dislikes the cherry. +13. Isla exited the kitchen. + +At this point, only Nathan, Elizabeth, Carter, Jacob, and Isla know the location of the watermelon, and Carter is the last one to have moved it. + +14. Nathan, Elizabeth, Carter, Jacob, and Isla entered the waiting_room. +15. Carter publicly claimed that the watermelon is in the red_envelope. +16. Isla privately told Carter that the watermelon is in the blue_container. + +Now Carter knows that the watermelon is not in the red_envelope, but he doesn't know that Isla knows the true location. + +17. Jacob, Carter, and Elizabeth entered the kitchen. +18. The watermelon is in the blue_cupboard. +19. Jacob moved the watermelon to the red_envelope. +20. Jacob exited the kitchen. +21. Carter moved the watermelon to the green_bucket. +22. Carter exited the kitchen. +23. Elizabeth moved the watermelon to the blue_container. +24. Elizabeth exited the kitchen. + +Now Elizabeth knows the true location of the watermelon, but Carter doesn't know that she knows. + +25. 
Jacob, Carter, and Elizabeth entered the waiting_room. +26. Jacob, Isla, Elizabeth, and Carter entered the porch. +27. The banana is in the red_drawer. +28. Jacob moved the banana to the blue_treasure_chest. +29. Isla likes the blue_bottle. +30. Jacob exited the porch. +31. Isla moved the banana to the green_treasure_chest. +32. Isla exited the porch. +33. Elizabeth moved the banana to the green_bathtub. +34. Elizabeth exited the porch. +35. Carter moved the banana to the blue_bucket. +36. Carter exited the porch. + +At this point, only Isla knows the true location of the banana. + +37. Jacob, Isla, Elizabeth, and Carter entered the waiting_room. +38. Isla privately told Elizabeth that the banana is in the red_drawer. +39. Carter privately told Nathan that the banana is in the blue_bucket. + +Now Elizabeth knows the true location of the banana, but Carter doesn't know that she knows. + +To answer the question, we need to track where Isla thinks the watermelon is and where Carter thinks Isla thinks the watermelon is. We know that Isla privately told Carter that the watermelon is in the blue_container, but we don't know if Carter believes her or not. + +Based on the given information, Elizabeth knows that the watermelon is in the blue_container, but she doesn't know if Carter knows this or not. Therefore, we cannot determine where Elizabeth thinks Carter thinks Isla thinks the watermelon is. + +The answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c557653681a920c1bb55e15cc1034ebf2400ad7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1,60 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Nathan think Elizabeth thinks Carter thinks Isla thinks the watermelon is? 
+Answer: blue_bottle +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: This is a complex question that requires careful analysis. We need to trace the thoughts of Nathan, Elizabeth, Carter, and Isla regarding the location of the watermelon. + +First, Nathan did not make any movements in the kitchen and left before any of the others moved the watermelon. Therefore, he has no direct knowledge of the watermelon's location. + +Elizabeth moved the watermelon to the red_envelope before leaving the kitchen. However, we do not know what she thinks about its current location. + +Carter moved the watermelon to the blue_cupboard before leaving the kitchen. He publicly claimed that the watermelon is in the red_envelope, but Isla privately told him that it is in the blue_container. Therefore, we know that Carter is lying about the watermelon's location. + +Isla made no movements in the kitchen but privately told Carter that the watermelon is in the blue_container. Therefore, we know that Isla knows the true location of the watermelon. 
+ +Based on these facts, we can conclude that Nathan thinks that Elizabeth thinks that Carter thinks that Isla thinks the watermelon is in the red_envelope. This is because Nathan has no direct knowledge of the watermelon's location, and Elizabeth moved it to the red_envelope before leaving the kitchen. Carter publicly claimed that the watermelon is in the red_envelope, so Nathan would assume that he thinks it is there. However, Isla privately told Carter that the watermelon is in the blue_container, so Nathan would assume that Isla thinks it is there. + +Therefore, the answer is J. red_envelope. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..88b8f10aeb6c9252b28238d172973412118460db --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. 
+Question: Where is the carrot really? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: C. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6767aa941b1d733e3afc01c8548b82089ce59c44 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. 
+11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does William really think the carrot is? +Answer: green_envelope +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a51d4d70fa8be3694e9e294fa384b7152a969477 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Hannah think William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: Hannah thinks William thinks the carrot is in the red_basket. 
(Option B) \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6616130b3252c9c444b4f93f72cf5697950c44a6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. +Question: Where does Jack think Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: C. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b46ec62bebfe8f004bcb69bf51491bdf2e809b26 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1,27 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Jack, Charlotte, Noah and Hannah entered the hall. +2 Noah saw a monkey. +3 The carrot is in the red_basket. +4 William made no movements and stayed in the hall for 1 minute. +5 William exited the hall. +6 Hannah saw a mouse. +7 Jack made no movements and stayed in the hall for 1 minute. +8 Jack exited the hall. +9 Charlotte made no movements and stayed in the hall for 1 minute. +10 Charlotte exited the hall. +11 Charlotte dislikes the tomato. +12 Noah moved the carrot to the green_envelope. +13 Noah exited the hall. +14 Hannah moved the carrot to the red_basket. +15 Hannah exited the hall. +16 William, Jack, Charlotte, Noah and Hannah entered the waiting_room. +17 Charlotte publicly claimed that carrot is in the green_envelope. +18 Hannah privately told Charlotte that the carrot is in the blue_container. 
+Question: Where does Charlotte think Jack thinks Hannah thinks William thinks the carrot is? +Answer: red_basket +Choices: A. green_envelope, B. red_basket, C. blue_container, D. red_crate, E. green_drawer, F. blue_bucket, G. green_cupboard, H. red_bottle, I. green_treasure_chest, J. blue_cupboard, K. red_pantry, L. red_container, M. blue_bathtub, N. red_envelope, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: C. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..09f856a5f6d0497107fae1ef19340a4852003add --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. 
+9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where is the potato really? +Answer: green_cupboard +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_cupboard +GPT-4 Explain: C. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c763af572e0615e50e78ca92cac21c81a3e6d1c6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Carter really think the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: A. 
blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9c042c487e98a24043803c46f94b216ecc09b5b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jacob think Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: N. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..867f7245eaa44b0705e9c8a574f07cdae80a291d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. +15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Alexander think Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. 
green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: C. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d2c17c61e221ec90f132f59adffd14640d012dd5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Avery, Jacob, Jackson and Alexander entered the study. +2 The potato is in the blue_bathtub. +3 Carter made no movements and stayed in the study for 1 minute. +4 Carter exited the study. +5 Avery moved the potato to the blue_pantry. +6 Avery exited the study. +7 Jacob moved the potato to the green_cupboard. +8 Jacob exited the study. +9 Jackson made no movements and stayed in the study for 1 minute. +10 Jackson exited the study. +11 Alexander made no movements and stayed in the study for 1 minute. +12 Alexander exited the study. +13 Carter, Avery, Jacob, Jackson and Alexander entered the waiting_room. +14 Jacob publicly claimed that potato is in the blue_bathtub. 
+15 Alexander privately told Jacob that the potato is in the blue_bottle. +Question: Where does Jackson think Alexander thinks Jacob thinks Carter thinks the potato is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. green_cupboard, C. blue_bottle, D. green_drawer, E. blue_pantry, F. red_drawer, G. red_box, H. red_envelope, I. red_basket, J. green_treasure_chest, K. green_bucket, L. blue_drawer, M. green_basket, N. green_bathtub, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: N. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7f47755465a294fe3842668b1bcacddaa3adb31f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. 
+8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where is the pear really? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cbe2230ec9e5eed94f03495b952014795202339e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Sophia really think the pear is? +Answer: red_pantry +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: F. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cabd5a5d4db68d7323653046c1d6e27ce0429de9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Ava think Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..21d25c70b2e35aa322894bb86467354a268609e2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. +16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery think Ava thinks Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. 
green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..782e40b62d0ffa1a6c1c6e7a775d947396ee7e22 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Avery, Isabella, Mila and Sophia entered the lounge. +2 The pear is in the blue_crate. +3 Ava moved the pear to the green_envelope. +4 Ava exited the lounge. +5 Avery moved the pear to the red_pantry. +6 Avery exited the lounge. +7 Isabella made no movements and stayed in the lounge for 1 minute. +8 Isabella exited the lounge. +9 Mila made no movements and stayed in the lounge for 1 minute. +10 Mila exited the lounge. +11 Sophia made no movements and stayed in the lounge for 1 minute. +12 Sophia exited the lounge. +13 Mila dislikes the pear. +14 Ava, Avery, Isabella, Mila and Sophia entered the waiting_room. +15 Isabella publicly claimed that pear is in the green_envelope. 
+16 Sophia privately told Isabella that the pear is in the blue_crate. +Question: Where does Mila think Avery thinks Ava thinks Sophia thinks the pear is? +Answer: green_envelope +Choices: A. blue_drawer, B. green_bucket, C. red_box, D. green_basket, E. red_container, F. blue_crate, G. blue_cupboard, H. red_pantry, I. green_envelope, J. red_crate, K. red_basket, L. green_treasure_chest, M. red_drawer, N. green_bathtub, O. red_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b6e5a316dc0119f23c51f67c3206b1a7bd6ee10b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. 
+8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: N. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a5090b263db23d99f9fc4f9737cf78c10eed3b48 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Ava really think the tangerine is? +Answer: red_basket +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: N. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..591b4f4f3edf757709d953b50894d2ab755b829b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Logan think Ava thinks the tangerine is? +Answer: green_box +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7905e8ac7f87cbd8ab8c86c070453a7a85f44155 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. +14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Owen think Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. 
green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..967186986f86795a3657407f224f94a50ace2d56 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Logan, Elizabeth, Alexander and Ava entered the front_yard. +2 The tangerine is in the red_bottle. +3 Owen made no movements and stayed in the front_yard for 1 minute. +4 Owen exited the front_yard. +5 Logan moved the tangerine to the green_box. +6 Logan exited the front_yard. +7 Elizabeth moved the tangerine to the red_basket. +8 Elizabeth exited the front_yard. +9 Alexander made no movements and stayed in the front_yard for 1 minute. +10 Alexander exited the front_yard. +11 Ava made no movements and stayed in the front_yard for 1 minute. +12 Ava exited the front_yard. +13 Owen, Logan, Elizabeth, Alexander and Ava entered the waiting_room. 
+14 Elizabeth publicly claimed that tangerine is in the blue_crate. +15 Ava privately told Elizabeth that the tangerine is in the red_basket. +Question: Where does Elizabeth think Owen thinks Logan thinks Ava thinks the tangerine is? +Answer: red_bottle +Choices: A. red_drawer, B. red_bucket, C. blue_drawer, D. green_crate, E. blue_treasure_chest, F. green_drawer, G. green_bucket, H. red_pantry, I. green_envelope, J. blue_pantry, K. red_bottle, L. red_container, M. blue_crate, N. green_box, O. red_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9847a6b8a426f1ddc86296b90d8841f382e557b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. 
+6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where is the onion really? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: E. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..457ffe171b7de6f380846119bbf744c538a41ba0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Owen really think the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..64ab19aab43e20556f9fea3ec9b7ddaedf017304 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Elizabeth think Owen thinks the onion is? +Answer: green_bucket +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. 
red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5501486a6431d7ac172cbe8b594a29a0f8ca76b2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. +8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. 
+17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Liam think Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f592dbfd2059ceebddc39af25107341ffe6de37d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Liam, Elizabeth and Owen entered the cellar. +2 Jack dislikes the tomato. +3 The onion is in the red_crate. +4 Noah made no movements and stayed in the cellar for 1 minute. +5 Noah exited the cellar. +6 Jack made no movements and stayed in the cellar for 1 minute. +7 Jack exited the cellar. 
+8 Liam made no movements and stayed in the cellar for 1 minute. +9 Liam exited the cellar. +10 Jack saw a dog. +11 Elizabeth moved the onion to the green_bucket. +12 Elizabeth exited the cellar. +13 Owen moved the onion to the red_crate. +14 Owen exited the cellar. +15 Noah, Jack, Liam, Elizabeth and Owen entered the waiting_room. +16 Liam privately told Noah that the onion is in the green_bucket. +17 Jack privately told Elizabeth that the onion is in the red_crate. +Question: Where does Noah think Liam thinks Elizabeth thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. red_crate, B. blue_bucket, C. red_envelope, D. red_bottle, E. green_bucket, F. green_bottle, G. blue_bathtub, H. blue_suitcase, I. blue_crate, J. blue_container, K. green_drawer, L. blue_treasure_chest, M. red_pantry, N. red_box, O. red_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..71a5ad7aec1f3b6850fb1a8e70525e5aa3251008 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where is the tangerine really? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: N. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9703df4dd37ec4e181dc0c5febd99a03748fd589 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Mila really think the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..32f3044011e68391740880d2caf17005ecf1f08f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Amelia think Mila thinks the tangerine is? +Answer: red_box +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. 
green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfc57db61bb3c369b81c4ba411fe836a2d7751e2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. +5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. 
+15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Elizabeth think Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: N. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..16f1f8cd4452155ab5ca966b3f0113a8d449b43a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the attic. +2 The tangerine is in the green_treasure_chest. +3 Mila made no movements and stayed in the attic for 1 minute. +4 Mila exited the attic. 
+5 Chloe made no movements and stayed in the attic for 1 minute. +6 Chloe exited the attic. +7 Amelia made no movements and stayed in the attic for 1 minute. +8 Chloe lost his watch. +9 Amelia exited the attic. +10 Benjamin moved the tangerine to the blue_pantry. +11 Benjamin exited the attic. +12 Elizabeth moved the tangerine to the green_treasure_chest. +13 Elizabeth exited the attic. +14 Mila, Chloe, Amelia, Benjamin and Elizabeth entered the waiting_room. +15 Amelia privately told Mila that the tangerine is in the red_box. +16 Chloe privately told Benjamin that the tangerine is in the green_treasure_chest. +Question: Where does Chloe think Elizabeth thinks Amelia thinks Mila thinks the tangerine is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. green_envelope, C. green_drawer, D. red_crate, E. red_bottle, F. green_bottle, G. green_bathtub, H. blue_treasure_chest, I. green_basket, J. red_pantry, K. green_treasure_chest, L. blue_pantry, M. red_bucket, N. red_box, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: N. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a26089d0cc70d014d3da9f1a85d12a340be065a8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where is the tangerine really? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2580bdb77ec0e6aae15ac837581bc6c5992bc3ec --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Amelia really think the tangerine is? +Answer: green_bottle +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c2e7b732c1e2a8aae90e851f19cd8169023dc81 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Ava think Amelia thinks the tangerine is? 
+Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2dea37be30c83d5bde8b99d750c8cf55dc85257 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. +4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. 
+12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Carter think Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d90ab02a562daea5d89550634a7dfc3c73c282b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Sophia, Amelia, Abigail and Carter entered the cellar. +2 The tangerine is in the red_basket. +3 Ava made no movements and stayed in the cellar for 1 minute. 
+4 Ava exited the cellar. +5 Sophia moved the tangerine to the green_bottle. +6 Sophia exited the cellar. +7 Amelia made no movements and stayed in the cellar for 1 minute. +8 Amelia exited the cellar. +9 Abigail moved the tangerine to the red_crate. +10 Abigail exited the cellar. +11 Carter moved the tangerine to the red_basket. +12 Carter exited the cellar. +13 Ava dislikes the corn. +14 Ava, Sophia, Amelia, Abigail and Carter entered the waiting_room. +15 Abigail publicly claimed that tangerine is in the green_bottle. +16 Carter privately told Ava that the tangerine is in the red_basket. +Question: Where does Abigail think Carter thinks Ava thinks Amelia thinks the tangerine is? +Answer: red_basket +Choices: A. green_crate, B. green_drawer, C. blue_crate, D. blue_bathtub, E. green_pantry, F. green_box, G. blue_pantry, H. red_box, I. green_bucket, J. red_bucket, K. green_bottle, L. red_basket, M. blue_cupboard, N. red_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: N. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d12f36b204c4bbcdc1ba0b504ede09cfa6ed555f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where is the tomato really? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: The tomato is in the green_box. (Answer: M) \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6ed9be2486dcd56212ff09b9f5eba9197b35b98 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Jack really think the tomato is? +Answer: green_box +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: M. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..56b61aed70207269b5435d39f88f73b59fc5b120 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Isla think Jack thinks the tomato is? +Answer: green_basket +Choices: A. red_basket, B. 
green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: M. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..27ff492edd17eb220f0dbbfe39a207aabe118584 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. +5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. 
+13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Carter think Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: M. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc0303ae0938c98901ae3e4cd75111ddd1753cf8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden, Isla, Carter, Jack and Evelyn entered the closet. +2 The tomato is in the red_crate. +3 Aiden made no movements and stayed in the closet for 1 minute. +4 Aiden exited the closet. 
+5 Isla made no movements and stayed in the closet for 1 minute. +6 Isla exited the closet. +7 Carter moved the tomato to the blue_container. +8 Carter exited the closet. +9 Jack moved the tomato to the green_box. +10 Jack exited the closet. +11 Evelyn moved the tomato to the red_crate. +12 Evelyn exited the closet. +13 Aiden, Isla, Carter, Jack and Evelyn entered the waiting_room. +14 Carter privately told Aiden that the tomato is in the green_box. +15 Isla privately told Jack that the tomato is in the green_basket. +Question: Where does Aiden think Carter thinks Isla thinks Jack thinks the tomato is? +Answer: red_crate +Choices: A. red_basket, B. green_pantry, C. blue_suitcase, D. green_bucket, E. red_envelope, F. green_drawer, G. green_bathtub, H. green_cupboard, I. blue_treasure_chest, J. red_drawer, K. blue_bottle, L. red_crate, M. green_box, N. blue_container, O. green_basket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: M. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cc7d3e7bb7d30eb3a11bd5236ccbb1549199d19 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where is the green_pepper really? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: J. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..50151149290776ccf866ea1e5a05add4819480e5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Alexander really think the green_pepper is? +Answer: blue_crate +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. 
blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: I. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c666d66ec6716763e147fe78208b9813333d912f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. 
+14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Evelyn think Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: J. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e7b313e1b2dfc5a7625b2e9193c958d7461d9e66 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. 
+5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Hannah think Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: J. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..82ed4fc01234345de6d89e371a05d2195755be25 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Alexander, Evelyn, Hannah, Abigail and Noah entered the den. +2 The green_pepper is in the blue_crate. +3 Alexander moved the green_pepper to the blue_suitcase. +4 Alexander exited the den. +5 Evelyn moved the green_pepper to the blue_treasure_chest. +6 Evelyn exited the den. +7 Hannah made no movements and stayed in the den for 1 minute. +8 Hannah exited the den. +9 Abigail made no movements and stayed in the den for 1 minute. +10 Abigail exited the den. +11 Noah made no movements and stayed in the den for 1 minute. +12 Noah exited the den. +13 Alexander, Evelyn, Hannah, Abigail and Noah entered the waiting_room. +14 Evelyn likes the green_cupboard. +15 Hannah privately told Alexander that the green_pepper is in the blue_crate. +16 Evelyn privately told Abigail that the green_pepper is in the green_envelope. +Question: Where does Abigail think Hannah thinks Evelyn thinks Alexander thinks the green_pepper is? +Answer: blue_suitcase +Choices: A. blue_bathtub, B. blue_bucket, C. green_treasure_chest, D. red_basket, E. green_bathtub, F. green_envelope, G. blue_crate, H. red_crate, I. blue_suitcase, J. blue_treasure_chest, K. blue_pantry, L. green_bucket, M. green_cupboard, N. green_bottle, O. red_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: J. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4938d90155519941c3aabb32613055536e58ca38 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. 
+Question: Where is the cabbage really? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: D. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..303d7540062a96d42aa123cc7634a01e88e67d77 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. 
+11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does William really think the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: E. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a17037167931b1a934b18c814ffb1827aa367467 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Nathan think William thinks the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: D. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cffc7e82e48ef76d0c942d51d2bb1bbecc974540 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. +Question: Where does Aiden think Nathan thinks William thinks the cabbage is? +Answer: red_box +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: E. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bed7de954cb9451bfb32a943996fbdd3f8c8370c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Nathan, Isabella, Aiden and William entered the master_bedroom. +2 William lost his gloves. +3 The cabbage is in the red_bucket. +4 Logan moved the cabbage to the green_pantry. +5 Aiden lost his gloves. +6 Logan exited the master_bedroom. +7 Nathan moved the cabbage to the red_box. +8 Nathan exited the master_bedroom. +9 Isabella made no movements and stayed in the master_bedroom for 1 minute. +10 Isabella exited the master_bedroom. +11 Aiden made no movements and stayed in the master_bedroom for 1 minute. +12 Aiden exited the master_bedroom. +13 William made no movements and stayed in the master_bedroom for 1 minute. +14 William exited the master_bedroom. +15 Logan, Nathan, Isabella, Aiden and William entered the waiting_room. +16 Isabella publicly claimed that cabbage is in the red_box. +17 William privately told Isabella that the cabbage is in the green_cupboard. 
+Question: Where does Logan think Aiden thinks Nathan thinks William thinks the cabbage is? +Answer: green_pantry +Choices: A. blue_treasure_chest, B. red_bucket, C. green_pantry, D. red_box, E. green_cupboard, F. blue_pantry, G. green_treasure_chest, H. red_crate, I. green_basket, J. blue_suitcase, K. blue_container, L. blue_drawer, M. red_drawer, N. red_pantry, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: D. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e314bbcd9ec8b677890404ef0d2e2726e5950ccb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. 
+9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where is the green_pepper really? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: B. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b8a43a724ec6fc9691e0ba308be4bb754ef21117 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. 
+2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Logan really think the green_pepper is? +Answer: blue_crate +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: D. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..92d86eb382f54a0222bd0fb886e7c205ba81d97f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Lily think Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..22a0f5e2391555625190383a22f5cec146fe144f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. +Question: Where does Ella think Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. 
green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..78019e445190cb200f5fd9035a519f4c3402d275 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Lily, Ella, Logan and Elizabeth entered the den. +2 The green_pepper is in the red_drawer. +3 Abigail made no movements and stayed in the den for 1 minute. +4 Abigail exited the den. +5 Lily made no movements and stayed in the den for 1 minute. +6 Lily exited the den. +7 Ella made no movements and stayed in the den for 1 minute. +8 Ella exited the den. +9 Logan moved the green_pepper to the blue_crate. +10 Logan exited the den. +11 Elizabeth made no movements and stayed in the den for 1 minute. +12 Elizabeth exited the den. +13 Abigail, Lily, Ella, Logan and Elizabeth entered the waiting_room. +14 Ella publicly claimed that green_pepper is in the red_pantry. +15 Elizabeth privately told Ella that the green_pepper is in the red_drawer. 
+Question: Where does Elizabeth think Ella thinks Lily thinks Logan thinks the green_pepper is? +Answer: red_drawer +Choices: A. red_pantry, B. red_drawer, C. red_bottle, D. blue_crate, E. green_box, F. green_envelope, G. blue_container, H. blue_treasure_chest, I. blue_bottle, J. green_crate, K. blue_cupboard, L. red_container, M. blue_pantry, N. green_bathtub, O. green_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f5c53ca65b56edc6d13a498579219bdb2ef859 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. 
+10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where is the lemon really? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b8f7f29efcda989dad05e95d245a7c7a7d48167 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Lily really think the lemon is? +Answer: blue_bathtub +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..266a90703d959b65d62fc0ac40cd1619a401bdf6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the lemon is? +Answer: blue_pantry +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: D. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7fec302a4cf668dc088dc2df783d9d47bd0cf6ec --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. +17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Liam think Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. 
red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: D. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..26f327f0ac2365a98d1325f194221877ba6fdd7d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Liam, Avery, Noah and Lily entered the garage. +2 The lemon is in the blue_bathtub. +3 Abigail moved the lemon to the blue_treasure_chest. +4 Lily dislikes the cabbage. +5 Abigail exited the garage. +6 Liam made no movements and stayed in the garage for 1 minute. +7 Liam exited the garage. +8 Avery moved the lemon to the blue_pantry. +9 Avery exited the garage. +10 Noah made no movements and stayed in the garage for 1 minute. +11 Noah exited the garage. +12 Lily moved the lemon to the blue_bathtub. +13 Lily exited the garage. +14 Abigail, Liam, Avery, Noah and Lily entered the waiting_room. +15 Abigail lost his watch. +16 Avery privately told Abigail that the lemon is in the green_drawer. 
+17 Liam privately told Noah that the lemon is in the blue_treasure_chest. +Question: Where does Noah think Liam thinks Avery thinks Lily thinks the lemon is? +Answer: blue_treasure_chest +Choices: A. blue_bathtub, B. red_envelope, C. blue_pantry, D. green_drawer, E. blue_treasure_chest, F. blue_crate, G. blue_cupboard, H. green_pantry, I. blue_drawer, J. green_envelope, K. red_drawer, L. red_bucket, M. green_box, N. red_container, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: D. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bc7be08853dfd2c2891854b02c236ce2db37843f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. 
+8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where is the peach really? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: M. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fd68c11982609c8d9cd7b30f17cd72824a6566b6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Avery really think the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: M. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d3a96a2ce5a89342f94b31c5bfa3e3d8139e2bc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Liam think Avery thinks the peach is? +Answer: red_bottle +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..33ef7f360d18e397dce8b570fcc8186b0d26fad8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. +14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Benjamin think Liam thinks Avery thinks the peach is? +Answer: blue_treasure_chest +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. 
green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: M. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8b6f20047b2eda76883027211dc425c08f3fee9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Liam, Benjamin, Avery and Mila entered the patio. +2 Liam lost his gloves. +3 The peach is in the red_basket. +4 Hannah made no movements and stayed in the patio for 1 minute. +5 Hannah exited the patio. +6 Liam moved the peach to the blue_treasure_chest. +7 Liam exited the patio. +8 Benjamin made no movements and stayed in the patio for 1 minute. +9 Benjamin exited the patio. +10 Avery made no movements and stayed in the patio for 1 minute. +11 Avery exited the patio. +12 Mila made no movements and stayed in the patio for 1 minute. +13 Mila exited the patio. 
+14 Hannah, Liam, Benjamin, Avery and Mila entered the waiting_room. +15 Liam lost his gloves. +16 Benjamin privately told Hannah that the peach is in the red_envelope. +17 Liam privately told Avery that the peach is in the red_bottle. +Question: Where does Hannah think Benjamin thinks Liam thinks Avery thinks the peach is? +Answer: red_basket +Choices: A. blue_bucket, B. blue_drawer, C. red_container, D. green_basket, E. blue_bathtub, F. red_drawer, G. green_bathtub, H. green_crate, I. green_envelope, J. green_drawer, K. red_pantry, L. red_basket, M. red_envelope, N. red_bottle, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: M. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f410a9421be74108e264f23d8d5f64d34b9eafa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. 
+5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where is the onion really? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: B. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea5acec2e8227715efa921573c12aa778dc34641 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Lily really think the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: B. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e40afe3338383a97a3b984fe47097d8e90fe3426 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Avery think Lily thinks the onion is? +Answer: red_drawer +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. 
green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: N. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c4ba096f1808b632d4a8673b553b2e5dffa3b892 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. +10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. 
+Question: Where does Emily think Avery thinks Lily thinks the onion is? +Answer: blue_pantry +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: B. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3f0d6132bca458b55b291bb2ea2109bdd5706aa0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Liam, Avery, Elizabeth and Lily entered the hallway. +2 The onion is in the green_crate. +3 Emily moved the onion to the blue_pantry. +4 Emily exited the hallway. +5 Liam moved the onion to the red_drawer. +6 Liam exited the hallway. +7 Avery made no movements and stayed in the hallway for 1 minute. +8 Avery exited the hallway. +9 Elizabeth made no movements and stayed in the hallway for 1 minute. 
+10 Elizabeth exited the hallway. +11 Lily made no movements and stayed in the hallway for 1 minute. +12 Lily exited the hallway. +13 Emily, Liam, Avery, Elizabeth and Lily entered the waiting_room. +14 Avery privately told Emily that the onion is in the blue_bottle. +15 Liam privately told Elizabeth that the onion is in the blue_treasure_chest. +Question: Where does Elizabeth think Emily thinks Avery thinks Lily thinks the onion is? +Answer: blue_pantry +Choices: A. green_crate, B. blue_bottle, C. blue_treasure_chest, D. blue_pantry, E. red_drawer, F. red_container, G. green_envelope, H. green_drawer, I. red_basket, J. green_basket, K. red_envelope, L. green_bathtub, M. blue_crate, N. green_pantry, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: D. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d1776b97ee00dec25a446a2704c00f84d046570 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: L. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b52810a1e6cde92c56ea9cd1ebb994621e87f72 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Jackson really think the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..15f36eaa2e6c2b10921d35dcb78a17ede82434b1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. 
+Question: Where does Benjamin think Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..84f8339ed57d837f9f1345773b65c45edc98eb69 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. 
+8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Mila think Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b8fd3d9939ffa444a2734bd3954104e09d33f6c7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1,24 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Benjamin, Jackson, Avery, Abigail and Mila entered the master_bedroom. +2 The cherry is in the green_bucket. +3 Benjamin made no movements and stayed in the master_bedroom for 1 minute. +4 Benjamin exited the master_bedroom. +5 Jackson made no movements and stayed in the master_bedroom for 1 minute. +6 Jackson exited the master_bedroom. +7 Avery made no movements and stayed in the master_bedroom for 1 minute. +8 Avery exited the master_bedroom. +9 Abigail made no movements and stayed in the master_bedroom for 1 minute. +10 Abigail exited the master_bedroom. +11 Mila made no movements and stayed in the master_bedroom for 1 minute. +12 Mila exited the master_bedroom. +13 Benjamin, Jackson, Avery, Abigail and Mila entered the waiting_room. +14 Avery privately told Benjamin that the cherry is in the blue_crate. +15 Jackson privately told Abigail that the cherry is in the green_bucket. +Question: Where does Abigail think Mila thinks Benjamin thinks Jackson thinks the cherry is? +Answer: green_bucket +Choices: A. blue_bottle, B. blue_suitcase, C. green_cupboard, D. red_drawer, E. red_pantry, F. blue_cupboard, G. red_basket, H. green_envelope, I. blue_bathtub, J. red_bottle, K. blue_crate, L. green_bucket, M. green_bottle, N. green_treasure_chest, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: L. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8af59acca977cceae6281f5d0a6f287f7e4272af --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where is the asparagus really? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..80bbcd5a878b17a0145c3ce90c2bdf94390881a0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Logan really think the asparagus is? 
+Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..16c5f04eb99d1efb6eb4f4737c81c0ea5aaf0d56 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. 
+11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Sophia think Logan thinks the asparagus is? +Answer: red_crate +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..547bf9ac05e12ba979d4a8a9bc1fb79c62b403d4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. 
+2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Elizabeth think Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: N. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7438cb0dda471b86c2906c632bf0738a21d55e5c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Elizabeth dislikes the orange. +2 Hannah, Emma, Elizabeth, Sophia and Logan entered the garage. +3 The asparagus is in the blue_drawer. +4 Hannah made no movements and stayed in the garage for 1 minute. +5 Hannah exited the garage. +6 Emma made no movements and stayed in the garage for 1 minute. +7 Emma exited the garage. +8 Elizabeth made no movements and stayed in the garage for 1 minute. +9 Elizabeth exited the garage. +10 Sophia made no movements and stayed in the garage for 1 minute. +11 Sophia exited the garage. +12 Logan made no movements and stayed in the garage for 1 minute. +13 Logan saw a dog. +14 Logan exited the garage. +15 Hannah, Emma, Elizabeth, Sophia and Logan entered the waiting_room. +16 Sophia publicly claimed that asparagus is in the red_crate. +17 Logan privately told Hannah that the asparagus is in the blue_drawer. +Question: Where does Hannah think Elizabeth thinks Sophia thinks Logan thinks the asparagus is? +Answer: blue_drawer +Choices: A. green_treasure_chest, B. green_bottle, C. green_drawer, D. green_envelope, E. red_bottle, F. red_box, G. blue_crate, H. red_envelope, I. red_drawer, J. red_container, K. blue_treasure_chest, L. blue_drawer, M. blue_pantry, N. red_crate, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..03386a8ea880f16a4f3755cbae96880c0331ea71 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where is the watermelon really? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. 
green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6acb01a4b558ad78925d0f6af70c9ee49cd09d8e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. 
+14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does William really think the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..31d06b505a6be2dc93592444b786a9b49b8e632b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. 
+5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Carter think William thinks the watermelon is? +Answer: green_basket +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: D. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c04f962e8c70176c5fbb9eb93a47b68c187cebed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Owen think Carter thinks William thinks the watermelon is? +Answer: green_envelope +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: C. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..757df9b5b3ff1d0313c0cbfff32e0415f43f5c72 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen, Jacob, Emma, William and Carter entered the sunroom. +2 The watermelon is in the green_crate. +3 Owen moved the watermelon to the green_envelope. +4 Owen exited the sunroom. +5 Jacob moved the watermelon to the green_bucket. +6 Jacob exited the sunroom. +7 Emma moved the watermelon to the blue_pantry. +8 Emma exited the sunroom. +9 William moved the watermelon to the green_basket. +10 William exited the sunroom. +11 Jacob dislikes the grapes. +12 Carter made no movements and stayed in the sunroom for 1 minute. +13 Carter exited the sunroom. +14 Owen, Jacob, Emma, William and Carter entered the waiting_room. +15 Emma privately told Owen that the watermelon is in the green_bucket. +16 Jacob privately told William that the watermelon is in the green_envelope. +Question: Where does Emma think Owen thinks Carter thinks William thinks the watermelon is? +Answer: green_envelope +Choices: A. green_crate, B. green_envelope, C. green_basket, D. green_bucket, E. blue_pantry, F. green_cupboard, G. red_drawer, H. red_container, I. 
blue_cupboard, J. green_treasure_chest, K. red_box, L. blue_bathtub, M. green_bottle, N. blue_drawer, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: E. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..800ffb21f9359a65fcbe67796ade84ee7fedbd0c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. 
+16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where is the tomato really? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..007774fabee4c3b11f47b708f8a95303b4faf66a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. 
+8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Emma really think the tomato is? +Answer: green_drawer +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb582bce762372665c45d829ac673235a58713b9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Liam think Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: N. 
green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..54e77f20bc13a41944cdfdb36d2e5a6c6148ba11 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Hannah think Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..186830a4462d2819eadf1087c6b414e35b84e17b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1,26 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, Hannah, Liam, Nathan and Carter entered the study. +2 Emma saw a cat. +3 The tomato is in the red_container. +4 Emma made no movements and stayed in the study for 1 minute. +5 Emma exited the study. +6 Hannah made no movements and stayed in the study for 1 minute. +7 Hannah exited the study. +8 Carter dislikes the banana. +9 Liam moved the tomato to the green_drawer. +10 Liam exited the study. +11 Nathan made no movements and stayed in the study for 1 minute. +12 Nathan exited the study. +13 Carter made no movements and stayed in the study for 1 minute. +14 Carter exited the study. +15 Emma, Hannah, Liam, Nathan and Carter entered the waiting_room. +16 Nathan publicly claimed that tomato is in the blue_bottle. +17 Carter privately told Emma that the tomato is in the green_drawer. +Question: Where does Carter think Hannah thinks Liam thinks Emma thinks the tomato is? +Answer: red_container +Choices: A. blue_bathtub, B. red_drawer, C. green_bathtub, D. green_envelope, E. blue_cupboard, F. green_box, G. blue_drawer, H. 
green_pantry, I. green_cupboard, J. blue_treasure_chest, K. red_bottle, L. red_container, M. green_bucket, N. green_drawer, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..afe51489db91ce442e13c207e94c8eaa1e654d2b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. 
+14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where is the lettuce really? +Answer: red_bucket +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67aa1ce72a9e817e44a2d9c7370ff6d3f713f60b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. 
+6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Isla really think the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: L. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1da4a1e6b0f7641fc971c6b60cdf97320a41c34a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Benjamin think Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c46cea6c80fd46751885ac5e97824648efec6d8a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. +14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Sophia think Benjamin thinks Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. 
green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2cfe68ff07f0924edc09a89759e29cd11587da85 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Isla, Benjamin, Alexander and Emily entered the living_room. +2 The lettuce is in the red_bucket. +3 Sophia moved the lettuce to the red_box. +4 Sophia exited the living_room. +5 Isla made no movements and stayed in the living_room for 1 minute. +6 Isla exited the living_room. +7 Benjamin made no movements and stayed in the living_room for 1 minute. +8 Benjamin exited the living_room. +9 Alexander moved the lettuce to the red_pantry. +10 Alexander exited the living_room. +11 Emily moved the lettuce to the red_bucket. +12 Emily exited the living_room. +13 Sophia, Isla, Benjamin, Alexander and Emily entered the waiting_room. 
+14 Benjamin privately told Sophia that the lettuce is in the red_bucket. +15 Isla lost his phone. +16 Isla privately told Alexander that the lettuce is in the red_pantry. +Question: Where does Emily think Sophia thinks Benjamin thinks Isla thinks the lettuce is? +Answer: red_box +Choices: A. blue_bathtub, B. red_crate, C. red_bottle, D. green_envelope, E. green_treasure_chest, F. blue_bottle, G. blue_treasure_chest, H. green_cupboard, I. blue_container, J. green_basket, K. red_bucket, L. red_pantry, M. blue_cupboard, N. blue_suitcase, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..060fec73dfb8d2e8c78e64f88d3b75550a509021 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. 
+5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where is the spinach really? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: F. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..328eb162c3842bc7255db363d97aa11b5fcbbd78 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Abigail really think the spinach is? +Answer: red_container +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: F. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9fedf59b07142fb7e1f9ff2022d39b06623e7c7e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Owen think Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. 
blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: G. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..362a32f0436a36aaef0e9095392d5a3c42289fbf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. +8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. 
+16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Aiden think Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2e9d1b7cdfc98dad272dc63b1c1bfc6176a8d25d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1,25 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Owen, Amelia, Jack and Aiden entered the laundry. +2 The spinach is in the blue_suitcase. +3 Abigail made no movements and stayed in the laundry for 1 minute. +4 Abigail exited the laundry. +5 Owen moved the spinach to the red_basket. +6 Owen exited the laundry. +7 Amelia made no movements and stayed in the laundry for 1 minute. 
+8 Amelia exited the laundry. +9 Jack moved the spinach to the green_pantry. +10 Abigail dislikes the lemon. +11 Jack exited the laundry. +12 Aiden moved the spinach to the blue_suitcase. +13 Aiden exited the laundry. +14 Abigail, Owen, Amelia, Jack and Aiden entered the waiting_room. +15 Amelia publicly claimed that spinach is in the red_container. +16 Aiden privately told Amelia that the spinach is in the blue_suitcase. +Question: Where does Jack think Aiden thinks Owen thinks Abigail thinks the spinach is? +Answer: blue_suitcase +Choices: A. red_envelope, B. blue_bottle, C. green_crate, D. red_pantry, E. blue_treasure_chest, F. blue_suitcase, G. red_basket, H. red_container, I. green_pantry, J. green_bathtub, K. blue_bucket, L. green_bucket, M. red_drawer, N. blue_pantry, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad12ff761f2dfc4b7c9a5bc8a68593043d58149a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where is the persimmon really? +Answer: green_drawer +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: H. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1c20c0bd0ac9215167a34306716bcc1afaa747cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. 
+26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Owen really think the persimmon is? +Answer: blue_bottle +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc45b4845029b31450237bb6905f90a45d1760f2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. 
+7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Amelia think Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: J. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..54dc3916eda9507e2535b8f20a9f3fd6d482c6c4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. +14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Aiden think Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. 
green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: J. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d56ca9878a2f713f48dbfcac3b8c3ec14b68122 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Owen, Aiden, Ella and Amelia entered the closet. +2 The persimmon is in the blue_pantry. +3 Sophia made no movements and stayed in the closet for 1 minute. +4 Sophia exited the closet. +5 Owen made no movements and stayed in the closet for 1 minute. +6 Owen exited the closet. +7 Aiden moved the persimmon to the green_treasure_chest. +8 Aiden exited the closet. +9 Ella made no movements and stayed in the closet for 1 minute. +10 Ella exited the closet. +11 Amelia moved the persimmon to the blue_pantry. +12 Amelia exited the closet. +13 Aiden saw a monkey. 
+14 Sophia, Owen, Aiden, Ella and Amelia entered the waiting_room. +15 Amelia, Aiden and Ella entered the closet. +16 Ella saw a mouse. +17 The persimmon is in the blue_pantry. +18 Amelia moved the persimmon to the green_drawer. +19 Amelia exited the closet. +20 Aiden made no movements and stayed in the closet for 1 minute. +21 Aiden exited the closet. +22 Ella made no movements and stayed in the closet for 1 minute. +23 Ella exited the closet. +24 Amelia, Aiden and Ella entered the waiting_room. +25 Sophia likes the red_drawer. +26 Ella publicly claimed that persimmon is in the blue_bottle. +27 Amelia privately told Ella that the persimmon is in the red_box. +Question: Where does Ella think Aiden thinks Amelia thinks Owen thinks the persimmon is? +Answer: blue_pantry +Choices: A. green_bathtub, B. red_drawer, C. green_basket, D. red_bottle, E. red_container, F. green_drawer, G. blue_pantry, H. red_box, I. green_treasure_chest, J. blue_bottle, K. red_bucket, L. green_pantry, M. red_crate, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: J. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2755a7634f6c60e9c31e4d7df5295510643cfb94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where is the persimmon really? +Answer: green_pantry +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. 
green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: K. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a0d2a3ce1427f57d470ece8c959942213aa7bb3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. 
+15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Ava really think the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8d7d547bb139cf4409fdf204c1f399faab85aad --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Evelyn think Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..10d137f9d7876aee2fceee7343c2f006a2465a0c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. +8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. 
+24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Charlotte think Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d983c6a5da9290fa983d10c13ed96eec280ea4a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the bathroom. +2 The persimmon is in the blue_crate. +3 Ava made no movements and stayed in the bathroom for 1 minute. +4 Ava exited the bathroom. +5 Charlotte moved the persimmon to the red_crate. +6 Charlotte exited the bathroom. +7 Evelyn moved the persimmon to the blue_cupboard. 
+8 Evelyn exited the bathroom. +9 Amelia moved the persimmon to the green_pantry. +10 Amelia exited the bathroom. +11 Benjamin made no movements and stayed in the bathroom for 1 minute. +12 Benjamin exited the bathroom. +13 Ava, Charlotte, Evelyn, Amelia and Benjamin entered the waiting_room. +14 Ava, Benjamin and Evelyn entered the office. +15 The onion is in the blue_bathtub. +16 Ava moved the onion to the green_box. +17 Ava exited the office. +18 Benjamin made no movements and stayed in the office for 1 minute. +19 Benjamin exited the office. +20 Evelyn made no movements and stayed in the office for 1 minute. +21 Evelyn exited the office. +22 Ava, Benjamin and Evelyn entered the waiting_room. +23 Benjamin privately told Evelyn that the onion is in the red_container. +24 Evelyn privately told Amelia that the onion is in the green_box. +Question: Where does Benjamin think Charlotte thinks Evelyn thinks Ava thinks the persimmon is? +Answer: blue_crate +Choices: A. green_box, B. blue_bathtub, C. green_bucket, D. green_cupboard, E. red_container, F. red_envelope, G. red_pantry, H. blue_suitcase, I. green_crate, J. green_drawer, K. green_pantry, L. blue_crate, M. blue_cupboard, N. red_crate, O. blue_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: N. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6ded693e145f0c2bcf6bf334946e2366d1645d3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where is the grapes really? +Answer: blue_pantry +Choices: A. blue_pantry, B. red_crate, C. 
green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: O. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6385ff2a2170e4aa82e0ea4d8e0ffa038a522879 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. 
+13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Benjamin really think the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: O. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..416df615be32d2f906102dec024a81986c72aa12 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Liam think Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. 
blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b4f9caccdb1e647de4cd9942c36dde02dbebc1c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. 
+13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Elizabeth think Liam thinks Benjamin thinks the grapes is? +Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: K. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8ad490639ab771ddd328782ff0b699031f902b4f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Liam, Elizabeth, Alexander and Owen entered the workshop. +2 The grapes is in the blue_pantry. +3 Benjamin moved the grapes to the blue_suitcase. +4 Benjamin exited the workshop. +5 Liam made no movements and stayed in the workshop for 1 minute. +6 Liam exited the workshop. +7 Alexander lost his gloves. +8 Elizabeth made no movements and stayed in the workshop for 1 minute. +9 Elizabeth exited the workshop. +10 Benjamin lost his phone. +11 Alexander moved the grapes to the red_crate. +12 Alexander exited the workshop. +13 Owen moved the grapes to the blue_pantry. +14 Owen exited the workshop. +15 Liam likes the red_bucket. +16 Benjamin, Liam, Elizabeth, Alexander and Owen entered the waiting_room. +17 Owen, Alexander and Benjamin entered the garage. +18 Liam saw a mouse. +19 The watermelon is in the green_envelope. +20 Owen moved the watermelon to the red_drawer. +21 Owen exited the garage. +22 Alexander made no movements and stayed in the garage for 1 minute. +23 Alexander exited the garage. +24 Benjamin moved the watermelon to the red_pantry. +25 Benjamin exited the garage. +26 Owen, Alexander and Benjamin entered the waiting_room. +27 Benjamin publicly claimed that watermelon is in the green_pantry. +28 Owen saw a monkey. +29 Owen privately told Benjamin that the watermelon is in the red_pantry. +Question: Where does Alexander think Elizabeth thinks Liam thinks Benjamin thinks the grapes is? 
+Answer: blue_suitcase +Choices: A. blue_pantry, B. red_crate, C. green_bottle, D. red_bucket, E. blue_suitcase, F. blue_bottle, G. green_basket, H. green_bathtub, I. blue_crate, J. red_bottle, K. green_pantry, L. green_envelope, M. green_drawer, N. red_drawer, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: K. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..54449524079c386e46fab8a884a4d1a1cd9153df --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. 
+11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where is the spinach really? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a755f20639bad124bcd3da3c75e8d518657384b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Avery really think the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. 
red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3bf58248942a5fcc22c9b27d5661df6dcf60fefe --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. 
+14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Jackson think Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..05dd171e8a41ea25d509168289a749bae1d46b11 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. +14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Isabella think Jackson thinks Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. 
green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..25fb1986712f24180d650d017f0d56ee43dbc3a6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella saw a monkey. +2 Mila, Nathan, Avery, Isabella and Jackson entered the kitchen. +3 The spinach is in the green_envelope. +4 Mila moved the spinach to the blue_container. +5 Mila exited the kitchen. +6 Nathan made no movements and stayed in the kitchen for 1 minute. +7 Nathan exited the kitchen. +8 Avery made no movements and stayed in the kitchen for 1 minute. +9 Avery exited the kitchen. +10 Isabella made no movements and stayed in the kitchen for 1 minute. +11 Isabella exited the kitchen. +12 Jackson moved the spinach to the green_envelope. +13 Jackson exited the kitchen. 
+14 Mila, Nathan, Avery, Isabella and Jackson entered the waiting_room. +15 Jackson, Avery and Mila entered the pantry. +16 The pear is in the green_bottle. +17 Jackson made no movements and stayed in the pantry for 1 minute. +18 Isabella likes the blue_container. +19 Jackson exited the pantry. +20 Avery moved the pear to the green_bucket. +21 Avery exited the pantry. +22 Mila moved the pear to the blue_crate. +23 Mila exited the pantry. +24 Jackson, Avery and Mila entered the waiting_room. +25 Avery privately told Mila that the pear is in the green_bottle. +26 Mila privately told Isabella that the pear is in the blue_crate. +Question: Where does Nathan think Isabella thinks Jackson thinks Avery thinks the spinach is? +Answer: blue_container +Choices: A. green_bottle, B. blue_crate, C. blue_pantry, D. green_bucket, E. blue_bucket, F. green_pantry, G. red_drawer, H. red_container, I. red_crate, J. blue_treasure_chest, K. blue_drawer, L. green_envelope, M. blue_bottle, N. green_basket, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..aeb3d4dbcd2fa5396b498e9c29c1a365f3e56b81 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where is the watermelon really? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. 
red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..83f3d8649f7138e4d47e15b0af72113b0116f524 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. 
+13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Jacob really think the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: M. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f74f31587dbb30c116fe254aa8189c18ea83fbd8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Isla think Jacob thinks the watermelon is? +Answer: red_basket +Choices: A. red_container, B. blue_pantry, C. 
blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: M. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d84ee070d76ba0b47efc30ca0f75f851f960991d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. 
+13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Logan think Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..702581e200c264cf991044e30dd47a3cfd971586 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, William, Jacob, Sophia and Isla entered the front_yard. +2 The watermelon is in the red_container. +3 Logan made no movements and stayed in the front_yard for 1 minute. +4 Sophia lost his phone. +5 Logan exited the front_yard. +6 Isla saw a dog. +7 William made no movements and stayed in the front_yard for 1 minute. +8 William exited the front_yard. +9 Jacob moved the watermelon to the red_basket. +10 Jacob exited the front_yard. +11 Sophia made no movements and stayed in the front_yard for 1 minute. +12 Sophia exited the front_yard. +13 Isla moved the watermelon to the red_container. +14 Isla exited the front_yard. +15 Logan, William, Jacob, Sophia and Isla entered the waiting_room. +16 Logan, William and Jacob entered the hall. +17 The eggplant is in the blue_container. +18 Logan made no movements and stayed in the hall for 1 minute. +19 Logan exited the hall. +20 Sophia dislikes the potato. +21 William moved the eggplant to the red_pantry. +22 William exited the hall. +23 Jacob made no movements and stayed in the hall for 1 minute. +24 Jacob exited the hall. +25 Logan, William and Jacob entered the waiting_room. +26 Logan saw a monkey. +27 Logan publicly claimed that eggplant is in the red_box. +28 Jacob privately told Isla that the eggplant is in the red_pantry. +Question: Where does Sophia think Logan thinks Isla thinks Jacob thinks the watermelon is? +Answer: red_container +Choices: A. 
red_container, B. blue_pantry, C. blue_bathtub, D. red_basket, E. green_box, F. green_treasure_chest, G. red_envelope, H. red_bucket, I. green_pantry, J. green_bottle, K. blue_container, L. red_box, M. red_pantry, N. green_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: M. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..67d17567671add8098df0208542349c73eead913 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. 
+13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where is the pear really? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa2a843cda67f62673840c337815032c716e5863 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Nathan really think the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. 
blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..af773c1b7acefe98000a5d8d1d11166740d898f6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. 
+16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Amelia think Nathan thinks the pear is? +Answer: green_bucket +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cfe83fce83fcfdc6a175b2f20032c1c2a5cbebc3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. +16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Isabella think Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. 
green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4f502680024d324b321b8b26bc6d711a6d8ed60a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Owen, Amelia, Aiden and Nathan entered the sunroom. +2 The pear is in the blue_pantry. +3 Isabella made no movements and stayed in the sunroom for 1 minute. +4 Isabella exited the sunroom. +5 Owen made no movements and stayed in the sunroom for 1 minute. +6 Owen exited the sunroom. +7 Isabella saw a mouse. +8 Amelia moved the pear to the green_bucket. +9 Amelia exited the sunroom. +10 Aiden moved the pear to the blue_suitcase. +11 Isabella lost his gloves. +12 Aiden exited the sunroom. +13 Nathan moved the pear to the blue_pantry. +14 Owen likes the green_cupboard. +15 Nathan exited the sunroom. 
+16 Isabella, Owen, Amelia, Aiden and Nathan entered the waiting_room. +17 Nathan, Amelia and Isabella entered the study. +18 The cherry is in the red_basket. +19 Nathan moved the cherry to the red_container. +20 Nathan exited the study. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the study. +23 Isabella made no movements and stayed in the study for 1 minute. +24 Isabella exited the study. +25 Nathan, Amelia and Isabella entered the waiting_room. +26 Amelia publicly claimed that cherry is in the red_envelope. +27 Isabella privately told Amelia that the cherry is in the blue_crate. +Question: Where does Owen think Isabella thinks Amelia thinks Nathan thinks the pear is? +Answer: blue_pantry +Choices: A. red_basket, B. blue_crate, C. green_bathtub, D. red_envelope, E. red_container, F. blue_drawer, G. green_cupboard, H. blue_container, I. green_envelope, J. red_box, K. green_bucket, L. blue_pantry, M. blue_cupboard, N. red_bottle, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e3340ee884104a9aa6b4a0155707edcbebfdf5a2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where is the potato really? 
+Answer: blue_crate +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..03f4320d3a7e463db408e2e8e324e352b4f8e9d7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. 
+12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Charlotte really think the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: A. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6af5a1861cd3420f0c9594e0aad05f0db8ad27f8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. 
+Question: Where does Noah think Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c4b069e80cc515535b91ac685f11d2077ab1439 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. 
+10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. +Question: Where does Ava think Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_cupboard +GPT-4 Explain: D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ecea4f5cb4ab1635f4f037e76b0600910aba9ab --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1,40 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Charlotte likes the blue_treasure_chest. +2 Chloe, Charlotte, Ava, Nathan and Noah entered the garden. +3 The potato is in the blue_cupboard. +4 Chloe moved the potato to the green_bottle. +5 Charlotte likes the green_bathtub. +6 Chloe exited the garden. +7 Charlotte made no movements and stayed in the garden for 1 minute. +8 Charlotte exited the garden. +9 Chloe saw a cat. +10 Ava made no movements and stayed in the garden for 1 minute. +11 Ava exited the garden. +12 Chloe likes the green_bottle. +13 Nathan moved the potato to the blue_bathtub. +14 Nathan exited the garden. +15 Noah moved the potato to the blue_cupboard. +16 Noah exited the garden. +17 Chloe, Charlotte, Ava, Nathan and Noah entered the waiting_room. +18 Charlotte, Ava and Nathan entered the garden. +19 The potato is in the blue_cupboard. +20 Charlotte made no movements and stayed in the garden for 1 minute. +21 Charlotte exited the garden. +22 Ava made no movements and stayed in the garden for 1 minute. +23 Ava exited the garden. +24 Noah dislikes the cherry. +25 Nathan moved the potato to the blue_crate. +26 Nathan exited the garden. +27 Charlotte, Ava and Nathan entered the waiting_room. +28 Ava likes the red_bucket. +29 Charlotte publicly claimed that potato is in the blue_cupboard. +30 Charlotte likes the green_bucket. +31 Nathan privately told Noah that the potato is in the blue_crate. 
+Question: Where does Nathan think Ava thinks Noah thinks Charlotte thinks the potato is? +Answer: blue_cupboard +Choices: A. blue_cupboard, B. green_bottle, C. green_bathtub, D. blue_crate, E. blue_bathtub, F. red_bucket, G. blue_treasure_chest, H. blue_bucket, I. green_bucket, J. red_envelope, K. green_basket, L. red_pantry, M. red_box, N. green_cupboard, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b194e44893e66c37be83ab2016b4c39138462bd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. 
+9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where is the cucumber really? +Answer: red_basket +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c6a6ed7b911626f9218c31bf62976e9f64a2b94 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Benjamin really think the cucumber is? 
+Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: C. red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7bb679a480aac3306e1470b0d616d18f90b0bae4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. 
+11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Charlotte think Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: C. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ac238a32bf332a8254dfbdc43c3c47e0f2607e6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. +11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Evelyn think Charlotte thinks Benjamin thinks the cucumber is? 
+Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..efbdc40a84f85d83e2b7d479c3eb39d23feed41c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1,37 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Charlotte, Isla, Ava and Evelyn entered the workshop. +2 Benjamin dislikes the asparagus. +3 The cucumber is in the green_crate. +4 Isla likes the blue_bucket. +5 Benjamin moved the cucumber to the red_container. +6 Benjamin exited the workshop. +7 Charlotte moved the cucumber to the red_basket. +8 Charlotte exited the workshop. +9 Isla made no movements and stayed in the workshop for 1 minute. +10 Isla exited the workshop. 
+11 Ava made no movements and stayed in the workshop for 1 minute. +12 Ava exited the workshop. +13 Evelyn made no movements and stayed in the workshop for 1 minute. +14 Evelyn exited the workshop. +15 Benjamin, Charlotte, Isla, Ava and Evelyn entered the waiting_room. +16 Charlotte, Isla and Evelyn entered the lounge. +17 The orange is in the green_bottle. +18 Ava likes the blue_treasure_chest. +19 Charlotte made no movements and stayed in the lounge for 1 minute. +20 Charlotte exited the lounge. +21 Isla moved the orange to the green_bathtub. +22 Isla exited the lounge. +23 Evelyn moved the orange to the green_bucket. +24 Evelyn exited the lounge. +25 Charlotte, Isla and Evelyn entered the waiting_room. +26 Charlotte publicly claimed that orange is in the green_bottle. +27 Benjamin likes the green_treasure_chest. +28 Evelyn privately told Benjamin that the orange is in the green_bucket. +Question: Where does Isla think Evelyn thinks Charlotte thinks Benjamin thinks the cucumber is? +Answer: red_container +Choices: A. green_crate, B. red_basket, C. red_container, D. red_envelope, E. blue_bucket, F. blue_cupboard, G. blue_bottle, H. blue_treasure_chest, I. blue_suitcase, J. green_pantry, K. green_bucket, L. green_bottle, M. green_cupboard, N. green_treasure_chest, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: red_container +GPT-4 Explain: L \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4f90cd506ae20e128feb2b9e0eb64f1414f76ae --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where is the cherry really? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. 
blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: J. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f0954088e0912e7fb4e6267d0a4630218bfee25 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. 
+16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Owen really think the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9a6e630abf60e79de21a3688a9393c2afea1944d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Ella think Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d3ac9650979e1e076d92de60bc5add83134bedcd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. +13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Abigail think Ella thinks Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. 
green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: J. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..466956290e3587a9638a65db1f6570513ace285f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Chloe, Owen, Emma, Ella and Abigail entered the staircase. +2 The cherry is in the red_drawer. +3 Chloe moved the cherry to the green_pantry. +4 Chloe exited the staircase. +5 Owen moved the cherry to the green_bucket. +6 Owen exited the staircase. +7 Emma made no movements and stayed in the staircase for 1 minute. +8 Emma exited the staircase. +9 Ella made no movements and stayed in the staircase for 1 minute. +10 Ella exited the staircase. +11 Abigail made no movements and stayed in the staircase for 1 minute. +12 Abigail exited the staircase. 
+13 Chloe, Owen, Emma, Ella and Abigail entered the waiting_room. +14 Ella, Emma and Chloe entered the patio. +15 The apple is in the blue_drawer. +16 Ella moved the apple to the green_bathtub. +17 Ella exited the patio. +18 Emma moved the apple to the red_crate. +19 Emma exited the patio. +20 Chloe moved the apple to the green_crate. +21 Chloe exited the patio. +22 Ella, Emma and Chloe entered the waiting_room. +23 Owen lost his watch. +24 Ella publicly claimed that apple is in the blue_container. +25 Chloe privately told Owen that the apple is in the green_crate. +Question: Where does Emma think Abigail thinks Ella thinks Owen thinks the cherry is? +Answer: green_bucket +Choices: A. blue_treasure_chest, B. green_basket, C. blue_crate, D. red_pantry, E. red_box, F. blue_drawer, G. blue_container, H. red_crate, I. green_bathtub, J. green_crate, K. green_bucket, L. red_drawer, M. blue_cupboard, N. green_pantry, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: J. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c00aff4a650a1f3718f7324a277146b7356b3660 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where is the sweet_potato really? +Answer: red_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. 
red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: N. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf0d242f1a10e3d142f0e1d5ab1dfd84172fad9a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. 
+15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Liam really think the sweet_potato is? +Answer: blue_container +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: M. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8416b7a6aaf6b7580e6d0d0f38ea5af2c0e6bf6e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Hannah think Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. 
green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: M. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8e3c9c02b6742f429b47699093d5a724cb4027cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. 
+15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Evelyn think Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: N. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6b0f0f86eeb0e35659433ba8b86426649655589 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1,33 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Liam, Hannah, Emma, Mila and Evelyn entered the cellar. +2 The sweet_potato is in the red_drawer. +3 Liam made no movements and stayed in the cellar for 1 minute. +4 Liam exited the cellar. +5 Hannah made no movements and stayed in the cellar for 1 minute. +6 Hannah exited the cellar. +7 Emma made no movements and stayed in the cellar for 1 minute. +8 Emma exited the cellar. +9 Mila moved the sweet_potato to the red_crate. +10 Mila exited the cellar. +11 Evelyn made no movements and stayed in the cellar for 1 minute. +12 Evelyn exited the cellar. +13 Liam, Hannah, Emma, Mila and Evelyn entered the waiting_room. +14 Liam, Mila and Evelyn entered the cellar. +15 The sweet_potato is in the red_crate. +16 Liam made no movements and stayed in the cellar for 1 minute. +17 Liam exited the cellar. +18 Mila moved the sweet_potato to the red_container. +19 Mila exited the cellar. +20 Evelyn made no movements and stayed in the cellar for 1 minute. +21 Evelyn exited the cellar. +22 Liam, Mila and Evelyn entered the waiting_room. +23 Mila publicly claimed that sweet_potato is in the blue_container. +24 Evelyn privately told Mila that the sweet_potato is in the blue_suitcase. +Question: Where does Emma think Evelyn thinks Hannah thinks Liam thinks the sweet_potato is? +Answer: red_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. green_drawer, D. red_basket, E. blue_crate, F. green_treasure_chest, G. 
blue_cupboard, H. green_pantry, I. green_cupboard, J. red_bucket, K. blue_container, L. red_drawer, M. red_container, N. blue_suitcase, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: N. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a619d452ea85d03677f3f70c748a3e5ed0b09855 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. 
+14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where is the carrot really? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: I. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0682d9ba3145bf95536ecfe85040670af3296844 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Benjamin really think the carrot is? +Answer: blue_drawer +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. 
blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_drawer +GPT-4 Explain: There is no information given about where Benjamin thinks the carrot is, so the answer is unknown. \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..232179c8ce9ee516e488dbf722d45f9090b9a1e1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. 
+13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Noah think Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6917ab28804e35148db8fb37bd26fba19e452fcb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. +14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Emily think Noah thinks Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. 
green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75cb354204f70f2eb04a2ab59b59ea4d2a29f3e4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Noah, Jack, Benjamin, Emily and Sophia entered the pantry. +2 The carrot is in the green_treasure_chest. +3 Noah moved the carrot to the blue_suitcase. +4 Noah exited the pantry. +5 Jack made no movements and stayed in the pantry for 1 minute. +6 Jack exited the pantry. +7 Benjamin made no movements and stayed in the pantry for 1 minute. +8 Benjamin exited the pantry. +9 Emily moved the carrot to the blue_drawer. +10 Noah dislikes the corn. +11 Emily exited the pantry. +12 Sophia made no movements and stayed in the pantry for 1 minute. +13 Sophia exited the pantry. 
+14 Noah, Jack, Benjamin, Emily and Sophia entered the waiting_room. +15 Benjamin, Noah and Emily entered the pantry. +16 The beans is in the blue_bottle. +17 Benjamin moved the beans to the blue_drawer. +18 Benjamin exited the pantry. +19 Noah made no movements and stayed in the pantry for 1 minute. +20 Jack likes the red_basket. +21 Noah exited the pantry. +22 Emily made no movements and stayed in the pantry for 1 minute. +23 Emily exited the pantry. +24 Benjamin, Noah and Emily entered the waiting_room. +25 Benjamin publicly claimed that beans is in the blue_bottle. +26 Emily privately told Sophia that the beans is in the blue_drawer. +Question: Where does Sophia think Emily thinks Noah thinks Benjamin thinks the carrot is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. blue_cupboard, D. red_container, E. red_basket, F. blue_bottle, G. green_treasure_chest, H. blue_treasure_chest, I. blue_drawer, J. blue_suitcase, K. green_bathtub, L. blue_bathtub, M. green_envelope, N. red_bottle, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..feeda5c3dc9a8a12acd1f07b14dee0a203cb689b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where is the onion really? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. 
red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..3007be454229a1978a06ad20bc23f36191bdf7e6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. 
+18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Owen really think the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..61849d5a2d41150105fde3b0bc70d434f535a433 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Emily think Owen thinks the onion is? +Answer: blue_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1e22807a62feb74ff1a0bc89153e5d507ca2aec --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. +14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Isabella think Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. 
green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: K. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1b1b2d1a7982beb68709c3767255ee4c84507e6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila, Isabella, Owen, Emily and Sophia entered the porch. +2 The onion is in the red_crate. +3 Mila made no movements and stayed in the porch for 1 minute. +4 Mila exited the porch. +5 Isabella made no movements and stayed in the porch for 1 minute. +6 Isabella exited the porch. +7 Owen moved the onion to the red_drawer. +8 Owen exited the porch. +9 Emily moved the onion to the red_bottle. +10 Emily exited the porch. +11 Sophia moved the onion to the red_crate. +12 Isabella lost his phone. +13 Sophia exited the porch. 
+14 Mila, Isabella, Owen, Emily and Sophia entered the waiting_room. +15 Isabella, Mila and Owen entered the porch. +16 The onion is in the red_crate. +17 Isabella moved the onion to the blue_crate. +18 Isabella exited the porch. +19 Sophia dislikes the onion. +20 Mila made no movements and stayed in the porch for 1 minute. +21 Mila exited the porch. +22 Owen made no movements and stayed in the porch for 1 minute. +23 Owen exited the porch. +24 Isabella, Mila and Owen entered the waiting_room. +25 Isabella publicly claimed that onion is in the green_cupboard. +26 Owen privately told Emily that the onion is in the blue_crate. +Question: Where does Sophia think Isabella thinks Emily thinks Owen thinks the onion is? +Answer: red_crate +Choices: A. green_bathtub, B. red_bucket, C. green_drawer, D. blue_bottle, E. green_treasure_chest, F. green_box, G. green_basket, H. blue_suitcase, I. green_envelope, J. red_basket, K. green_cupboard, L. red_crate, M. red_bottle, N. red_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: K. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e6cf6e9b3b7c80bf7951b04228026165113c1e6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where is the melon really? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. 
blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: M. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..55a9108133a8fa5fd4a04a35086d6313468228bd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. 
+18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Jacob really think the melon is? +Answer: green_drawer +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: M. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe7cdfdc4fb4b6a9c537f72bf442d29bcc80742f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Lily think Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..54d87b5a2486be75541f7cec710db25f23a09c0b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. +13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Evelyn think Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. 
blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4903e882941a4ab9ccd5a62a70e1b2795620528 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Lily, Amelia, Jacob, Evelyn and Ava entered the garden. +2 The melon is in the blue_treasure_chest. +3 Lily made no movements and stayed in the garden for 1 minute. +4 Lily exited the garden. +5 Amelia moved the melon to the green_bucket. +6 Amelia exited the garden. +7 Jacob moved the melon to the green_drawer. +8 Jacob exited the garden. +9 Evelyn moved the melon to the green_bottle. +10 Evelyn exited the garden. +11 Ava moved the melon to the blue_treasure_chest. +12 Ava exited the garden. 
+13 Lily, Amelia, Jacob, Evelyn and Ava entered the waiting_room. +14 Jacob saw a cat. +15 Lily, Jacob and Amelia entered the dining_room. +16 The cherry is in the green_treasure_chest. +17 Lily moved the cherry to the red_box. +18 Lily exited the dining_room. +19 Jacob moved the cherry to the blue_bottle. +20 Jacob exited the dining_room. +21 Amelia moved the cherry to the red_envelope. +22 Amelia exited the dining_room. +23 Lily, Jacob and Amelia entered the waiting_room. +24 Jacob publicly claimed that cherry is in the red_box. +25 Amelia privately told Jacob that the cherry is in the red_envelope. +Question: Where does Ava think Evelyn thinks Lily thinks Jacob thinks the melon is? +Answer: blue_treasure_chest +Choices: A. green_bottle, B. blue_treasure_chest, C. blue_bucket, D. green_bucket, E. green_drawer, F. green_envelope, G. red_basket, H. green_crate, I. green_bathtub, J. blue_suitcase, K. red_box, L. green_treasure_chest, M. red_envelope, N. blue_container, O. blue_bottle + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: B. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..030d4bb7b1c47a52d32366d1c7b1bd369ed3b743 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where is the peas really? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. 
blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc02efd05e97564e880b8105530d4a62ed414c3a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. 
+17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Emma really think the peas is? +Answer: red_pantry +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: A. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d6ff4e48a0d9dd6ce002e83ab2a06b8ac771e2c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Hannah think Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b108a1910669afbb62686bde99270ec5455bc508 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. +7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. 
+26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Chloe think Hannah thinks Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c2d7d7148c8ef9a065fbeda801187f0f2af9f8a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Emma, Isabella, Hannah and Chloe entered the hallway. +2 The peas is in the red_bottle. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Emma made no movements and stayed in the hallway for 1 minute. +6 Emma exited the hallway. 
+7 Isabella moved the peas to the green_bottle. +8 Isabella exited the hallway. +9 Hannah moved the peas to the blue_treasure_chest. +10 Isabella dislikes the tangerine. +11 Hannah exited the hallway. +12 Chloe moved the peas to the red_bottle. +13 Chloe lost his phone. +14 Chloe exited the hallway. +15 Logan, Emma, Isabella, Hannah and Chloe entered the waiting_room. +16 Isabella, Logan and Emma entered the hallway. +17 The peas is in the red_bottle. +18 Isabella moved the peas to the blue_treasure_chest. +19 Isabella exited the hallway. +20 Logan moved the peas to the blue_bathtub. +21 Logan exited the hallway. +22 Emma moved the peas to the red_pantry. +23 Emma exited the hallway. +24 Isabella, Logan and Emma entered the waiting_room. +25 Logan publicly claimed that peas is in the green_bottle. +26 Emma privately told Logan that the peas is in the red_bottle. +Question: Where does Logan think Chloe thinks Hannah thinks Emma thinks the peas is? +Answer: blue_treasure_chest +Choices: A. red_bottle, B. red_pantry, C. green_bottle, D. blue_bathtub, E. blue_treasure_chest, F. green_box, G. green_cupboard, H. green_crate, I. green_drawer, J. red_drawer, K. green_treasure_chest, L. blue_drawer, M. blue_cupboard, N. blue_container, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0acc827dd53eb63947557fc22fe79dd1ccf283b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where is the cherry really? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. 
green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: H. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..26d4b4c35757e955d19978168f3e2dc61d5327f5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. 
+17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Nathan really think the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..299e964cdef346861497d87a30e8ffeab92e29fa --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does William think Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..359245df614b08d8fa9108bce9befc7213abcfba --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. +10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. 
+Question: Where does Ava think William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: C. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d8ca491592a5e8c303345f62cec0c948dffdafc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emma, William, Isla, Ava and Nathan entered the sunroom. +2 The cherry is in the blue_suitcase. +3 Emma made no movements and stayed in the sunroom for 1 minute. +4 Emma exited the sunroom. +5 William made no movements and stayed in the sunroom for 1 minute. +6 William exited the sunroom. +7 Isla moved the cherry to the red_bottle. +8 Isla exited the sunroom. +9 Ava moved the cherry to the green_basket. 
+10 Ava exited the sunroom. +11 Nathan moved the cherry to the blue_suitcase. +12 William saw a cat. +13 Nathan exited the sunroom. +14 Emma, William, Isla, Ava and Nathan entered the waiting_room. +15 Emma, Ava and Isla entered the laundry. +16 The sweet_potato is in the green_drawer. +17 Emma moved the sweet_potato to the green_cupboard. +18 Emma exited the laundry. +19 Ava moved the sweet_potato to the blue_cupboard. +20 Ava exited the laundry. +21 Isla moved the sweet_potato to the green_bathtub. +22 Isla exited the laundry. +23 Emma, Ava and Isla entered the waiting_room. +24 Ava privately told Isla that the sweet_potato is in the green_drawer. +25 Isla privately told William that the sweet_potato is in the green_bathtub. +Question: Where does Emma think Ava thinks William thinks Nathan thinks the cherry is? +Answer: blue_suitcase +Choices: A. green_drawer, B. green_treasure_chest, C. blue_cupboard, D. green_bathtub, E. green_cupboard, F. red_envelope, G. blue_suitcase, H. green_bottle, I. red_bottle, J. green_basket, K. red_container, L. green_crate, M. blue_drawer, N. red_drawer, O. red_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: E. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..978c40f48bffe4bcba92a7d77e1d1abf7df3a79e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where is the watermelon really? 
+Answer: blue_container +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: G. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8866610c7bfbf6b1cde1adadd4e6cc42a75a9179 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. 
+12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Benjamin really think the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: G. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..39e83509bef081e02dfeab68b369f0618d129236 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. 
+Question: Where does Emma think Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: H. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa90d233bfa6a0457b5c26f20a9799afb60c3dcb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. 
+11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. +Question: Where does Isabella think Emma thinks Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: G. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc422da60a27580989fdf9720fdcd5673c894622 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1,38 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Emma, Charlotte and Liam entered the workshop. +2 Liam lost his phone. +3 The watermelon is in the blue_bottle. +4 Benjamin moved the watermelon to the green_drawer. +5 Benjamin exited the workshop. +6 Isabella moved the watermelon to the blue_bucket. +7 Benjamin dislikes the lime. +8 Isabella exited the workshop. +9 Emma made no movements and stayed in the workshop for 1 minute. +10 Emma exited the workshop. +11 Charlotte moved the watermelon to the blue_container. +12 Charlotte exited the workshop. +13 Liam made no movements and stayed in the workshop for 1 minute. +14 Liam exited the workshop. +15 Benjamin likes the blue_bottle. +16 Benjamin, Isabella, Emma, Charlotte and Liam entered the waiting_room. +17 Charlotte, Liam and Isabella entered the lounge. +18 The green_pepper is in the red_bottle. +19 Charlotte likes the green_envelope. +20 Charlotte moved the green_pepper to the green_envelope. +21 Charlotte exited the lounge. +22 Liam moved the green_pepper to the red_drawer. +23 Liam exited the lounge. +24 Isabella moved the green_pepper to the red_box. +25 Isabella exited the lounge. +26 Charlotte, Liam and Isabella entered the waiting_room. +27 Liam likes the blue_bucket. +28 Liam privately told Isabella that the green_pepper is in the red_bottle. +29 Isabella privately told Benjamin that the green_pepper is in the red_box. 
+Question: Where does Liam think Isabella thinks Emma thinks Benjamin thinks the watermelon is? +Answer: green_drawer +Choices: A. red_bottle, B. green_envelope, C. red_box, D. red_drawer, E. blue_suitcase, F. blue_container, G. blue_bottle, H. green_drawer, I. blue_bucket, J. red_container, K. blue_drawer, L. green_bottle, M. red_pantry, N. blue_cupboard, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_drawer +GPT-4 Explain: H. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..28a92f1d337f0345d28c3f8acc0179a8a07317a4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. 
+9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where is the peach really? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..813019a7421e8a3896040a12f03ae091b9b9405b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Chloe really think the peach is? +Answer: green_bathtub +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. 
red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8c17aa37b1632faac354993f19693452b90feb8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. 
+13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Isabella think Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..59c6c57ca98e63703afe89b7e2daa16998568979 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. +13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does Nathan think Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. 
green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ce1463b889b0f251a9d17babe2e33a8a132e944 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1,35 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Isabella, William, Chloe and Elizabeth entered the basement. +2 The peach is in the red_basket. +3 Nathan made no movements and stayed in the basement for 1 minute. +4 Nathan exited the basement. +5 Isabella made no movements and stayed in the basement for 1 minute. +6 Isabella exited the basement. +7 William moved the peach to the green_bathtub. +8 William exited the basement. +9 Chloe made no movements and stayed in the basement for 1 minute. +10 Chloe exited the basement. +11 Elizabeth moved the peach to the red_basket. +12 Elizabeth exited the basement. 
+13 Nathan, Isabella, William, Chloe and Elizabeth entered the waiting_room. +14 Isabella, Elizabeth and William entered the workshop. +15 The beans is in the green_drawer. +16 Isabella moved the beans to the red_box. +17 Isabella exited the workshop. +18 Elizabeth moved the beans to the blue_bucket. +19 Elizabeth exited the workshop. +20 William moved the beans to the red_bucket. +21 Elizabeth dislikes the plum. +22 William exited the workshop. +23 Isabella, Elizabeth and William entered the waiting_room. +24 Isabella lost his phone. +25 William publicly claimed that beans is in the green_drawer. +26 Isabella privately told William that the beans is in the red_box. +Question: Where does William think Nathan thinks Isabella thinks Chloe thinks the peach is? +Answer: red_basket +Choices: A. green_bucket, B. blue_bottle, C. blue_drawer, D. blue_bathtub, E. green_bottle, F. green_drawer, G. red_bucket, H. red_envelope, I. red_box, J. blue_bucket, K. green_cupboard, L. red_basket, M. green_basket, N. green_box, O. green_bathtub + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_basket +GPT-4 Explain: L. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..069edd39a6cbe2ea9c5b286af1eab62e70a14ca4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where is the asparagus really? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. 
green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad76be783515b9780184bbbe5fa01cc2d70d86a7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. 
+15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Aiden really think the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b2ed258e67289fcd4b61b69b74360945ec76d6b7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Emily think Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. 
blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..54ce6d890094ca4e3b8b7f69255a0fefe18bc6c8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. 
+15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Avery think Emily thinks Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..84b5575a1a43e19da22153cc484ba26fdebadda9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Owen, Emily, Aiden and Avery entered the hall. +2 The asparagus is in the green_cupboard. +3 Hannah lost his phone. +4 Hannah moved the asparagus to the green_treasure_chest. +5 Hannah exited the hall. +6 Owen made no movements and stayed in the hall for 1 minute. +7 Owen exited the hall. +8 Emily made no movements and stayed in the hall for 1 minute. +9 Emily exited the hall. +10 Aiden made no movements and stayed in the hall for 1 minute. +11 Aiden exited the hall. +12 Owen likes the green_basket. +13 Avery made no movements and stayed in the hall for 1 minute. +14 Avery exited the hall. +15 Hannah, Owen, Emily, Aiden and Avery entered the waiting_room. +16 Hannah, Owen and Aiden entered the bathroom. +17 The carrot is in the blue_crate. +18 Emily likes the red_crate. +19 Hannah moved the carrot to the green_drawer. +20 Hannah exited the bathroom. +21 Owen moved the carrot to the green_basket. +22 Owen exited the bathroom. +23 Aiden made no movements and stayed in the bathroom for 1 minute. +24 Aiden exited the bathroom. +25 Hannah, Owen and Aiden entered the waiting_room. +26 Hannah publicly claimed that carrot is in the blue_crate. +27 Aiden privately told Emily that the carrot is in the green_basket. +Question: Where does Hannah think Avery thinks Emily thinks Aiden thinks the asparagus is? +Answer: green_treasure_chest +Choices: A. green_cupboard, B. green_treasure_chest, C. green_bucket, D. 
red_envelope, E. green_bathtub, F. blue_crate, G. green_drawer, H. green_basket, I. green_envelope, J. blue_container, K. red_drawer, L. green_crate, M. red_crate, N. blue_cupboard, O. blue_suitcase + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: Hannah thinks Avery thinks Emily thinks Aiden thinks the asparagus is in the green_treasure_chest. (B) \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..594341e6dfaf0469b8bbcf65f93f84b4f91a4cdd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. 
+11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where is the lettuce really? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: J. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..22c2047e7eb339e3d6844cd14ffb5f70e7e4ac09 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Isla really think the lettuce is? +Answer: green_pantry +Choices: A. green_pantry, B. red_basket, C. 
blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: J. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6439b09ecd07eb3c5b957d48333ec760b1db53bc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. 
+13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Charlotte think Isla thinks the lettuce is? +Answer: blue_bathtub +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bathtub +GPT-4 Explain: I. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a4dce127dfd8921636cc4c072287dfbe3caaad4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. +13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Amelia think Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. 
red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: J. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c47206c0b783077f3286006f3c766dc183ceee59 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1,36 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 William, Amelia, Charlotte, Aiden and Isla entered the living_room. +2 The lettuce is in the green_pantry. +3 William moved the lettuce to the blue_cupboard. +4 William exited the living_room. +5 Amelia made no movements and stayed in the living_room for 1 minute. +6 Amelia exited the living_room. +7 Charlotte moved the lettuce to the blue_bathtub. +8 Charlotte exited the living_room. +9 Aiden moved the lettuce to the red_box. +10 Aiden exited the living_room. +11 Isla moved the lettuce to the green_pantry. +12 Isla exited the living_room. 
+13 William, Amelia, Charlotte, Aiden and Isla entered the waiting_room. +14 Charlotte, William and Amelia entered the sunroom. +15 The apple is in the red_bucket. +16 Charlotte moved the apple to the blue_container. +17 Charlotte exited the sunroom. +18 Charlotte dislikes the grapes. +19 William made no movements and stayed in the sunroom for 1 minute. +20 William exited the sunroom. +21 Charlotte dislikes the potato. +22 Amelia made no movements and stayed in the sunroom for 1 minute. +23 Amelia exited the sunroom. +24 Charlotte, William and Amelia entered the waiting_room. +25 William publicly claimed that apple is in the blue_container. +26 William dislikes the apple. +27 Amelia privately told William that the apple is in the blue_suitcase. +Question: Where does Aiden think Amelia thinks Charlotte thinks Isla thinks the lettuce is? +Answer: blue_cupboard +Choices: A. green_pantry, B. red_basket, C. blue_cupboard, D. red_box, E. blue_bathtub, F. red_bucket, G. red_envelope, H. red_bottle, I. blue_suitcase, J. blue_container, K. red_pantry, L. green_cupboard, M. red_crate, N. blue_drawer, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: J. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ae7faef575306d15cb0f2206642d11755dc40ac --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where is the apple really? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. 
red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..28eb0fdc7328694580780b5aa98e43e8b918ba8c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. 
+16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Jack really think the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..844b8e47251f298c2d371055bb2e1a85052fa2c4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Evelyn think Jack thinks the apple is? +Answer: green_bottle +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. 
An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f0c943021c67d1b097953e146955b1351567967 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. +9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. 
+25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Ella think Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: N. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..35aac197667d352b714274549d2bc543c0b5a5c0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1,34 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella, Amelia, Jack, Evelyn and Hannah entered the den. +2 The apple is in the green_pantry. +3 Ella made no movements and stayed in the den for 1 minute. +4 Ella exited the den. +5 Amelia made no movements and stayed in the den for 1 minute. +6 Amelia exited the den. +7 Jack moved the apple to the green_bottle. +8 Jack exited the den. 
+9 Evelyn made no movements and stayed in the den for 1 minute. +10 Evelyn exited the den. +11 Hannah made no movements and stayed in the den for 1 minute. +12 Hannah exited the den. +13 Ella, Amelia, Jack, Evelyn and Hannah entered the waiting_room. +14 Amelia, Ella and Evelyn entered the sunroom. +15 The onion is in the red_drawer. +16 Amelia made no movements and stayed in the sunroom for 1 minute. +17 Amelia exited the sunroom. +18 Ella moved the onion to the red_pantry. +19 Ella likes the green_bucket. +20 Ella exited the sunroom. +21 Evelyn made no movements and stayed in the sunroom for 1 minute. +22 Evelyn exited the sunroom. +23 Amelia, Ella and Evelyn entered the waiting_room. +24 Ella publicly claimed that onion is in the green_treasure_chest. +25 Evelyn privately told Ella that the onion is in the red_pantry. +Question: Where does Amelia think Ella thinks Evelyn thinks Jack thinks the apple is? +Answer: green_pantry +Choices: A. green_pantry, B. red_bottle, C. red_box, D. green_bottle, E. green_crate, F. red_container, G. blue_suitcase, H. blue_cupboard, I. blue_container, J. green_box, K. green_bucket, L. red_drawer, M. green_envelope, N. green_treasure_chest, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: D. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d75a016cd480002fce1cab5db74afde5a9223e7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. 
+32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where is the peas really? +Answer: green_bottle +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: I. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1ef27ec339678cb82acb169c96f88eafb02bb3d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. 
+Question: Where does Jack really think the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..239f92a766efa30b4727b4b8f92ee99f35b86753 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. 
+11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Jackson think Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c4f459d5421f475620420622e0cad47c54d43e75 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. 
+20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. +31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Logan think Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: I. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..79be62513744607be3daedd259aa4e8cf1c24726 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Logan, Jackson, Jack, Emily and Isabella entered the hallway. +2 The peas is in the blue_suitcase. +3 Logan made no movements and stayed in the hallway for 1 minute. +4 Logan exited the hallway. +5 Jackson made no movements and stayed in the hallway for 1 minute. +6 Jack likes the blue_crate. +7 Jackson exited the hallway. +8 Jack moved the peas to the red_crate. +9 Jack exited the hallway. +10 Emily moved the peas to the green_bottle. +11 Emily exited the hallway. +12 Isabella made no movements and stayed in the hallway for 1 minute. +13 Jackson dislikes the turnip. +14 Isabella exited the hallway. +15 Logan, Jackson, Jack, Emily and Isabella entered the waiting_room. +16 Emily publicly claimed that peas is in the blue_suitcase. +17 Isabella privately told Logan that the peas is in the green_bottle. +18 Isabella, Emily and Logan entered the attic. +19 The potato is in the green_drawer. +20 Isabella moved the potato to the red_basket. +21 Isabella exited the attic. +22 Jackson dislikes the cucumber. +23 Emily moved the potato to the green_bathtub. +24 Emily exited the attic. +25 Logan moved the potato to the blue_crate. +26 Logan exited the attic. +27 Isabella, Emily and Logan entered the waiting_room. +28 Jack, Isabella, Emily and Logan entered the patio. +29 The cherry is in the blue_bottle. +30 Jack made no movements and stayed in the patio for 1 minute. 
+31 Jack exited the patio. +32 Isabella moved the cherry to the green_envelope. +33 Isabella exited the patio. +34 Emily made no movements and stayed in the patio for 1 minute. +35 Emily exited the patio. +36 Logan moved the cherry to the blue_cupboard. +37 Logan exited the patio. +38 Emily dislikes the peas. +39 Jack, Isabella, Emily and Logan entered the waiting_room. +40 Isabella privately told Emily that the cherry is in the blue_cupboard. +41 Logan privately told Jackson that the cherry is in the blue_cupboard. +Question: Where does Isabella think Logan thinks Jackson thinks Jack thinks the peas is? +Answer: blue_suitcase +Choices: A. blue_crate, B. green_drawer, C. red_basket, D. blue_drawer, E. green_bathtub, F. blue_bottle, G. green_pantry, H. red_envelope, I. blue_cupboard, J. green_envelope, K. red_crate, L. blue_suitcase, M. green_bottle, N. red_bucket, O. red_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: I. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..29754b1175429729996c1811847df67ae962978f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where is the persimmon really? +Answer: green_bathtub +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bathtub +GPT-4 Explain: K. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..479c69fab25d143c953565051306e9462f21ce11 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Mila really think the persimmon is? +Answer: green_bucket +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: N. 
blue cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c251f1286add5aef0738f8aa780c60b677925713 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Emily think Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: N. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..187bda3efca870748dc5e4134e241fe208e44a39 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Charlotte think Emily thinks Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: N. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ac83373ffcaa8d61dee14c9b628d5ba270c9f47 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1,54 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Emily, Mila, Benjamin, Emma and Charlotte entered the back_yard. +2 Benjamin lost his phone. +3 The persimmon is in the green_bathtub. +4 Mila likes the red_envelope. +5 Emily moved the persimmon to the red_envelope. +6 Emily exited the back_yard. +7 Mila moved the persimmon to the green_box. +8 Emma lost his phone. +9 Mila exited the back_yard. +10 Benjamin moved the persimmon to the red_pantry. +11 Emily saw a dog. +12 Benjamin exited the back_yard. +13 Emma moved the persimmon to the green_bucket. +14 Emma exited the back_yard. +15 Charlotte moved the persimmon to the green_bathtub. +16 Charlotte exited the back_yard. +17 Emily, Mila, Benjamin, Emma and Charlotte entered the waiting_room. +18 Emma publicly claimed that persimmon is in the green_bucket. +19 Charlotte privately told Emily that the persimmon is in the green_bathtub. +20 Charlotte, Emma and Mila entered the garden. +21 The eggplant is in the green_crate. +22 Charlotte made no movements and stayed in the garden for 1 minute. +23 Charlotte exited the garden. +24 Emma made no movements and stayed in the garden for 1 minute. +25 Emma lost his phone. +26 Emma exited the garden. +27 Mila moved the eggplant to the blue_cupboard. +28 Mila exited the garden. +29 Charlotte, Emma and Mila entered the waiting_room. +30 Emma, Charlotte, Benjamin and Emily entered the garden. +31 The apple is in the green_bottle. +32 Emma lost his gloves. 
+33 Emma made no movements and stayed in the garden for 1 minute. +34 Emma exited the garden. +35 Charlotte made no movements and stayed in the garden for 1 minute. +36 Charlotte saw a cat. +37 Charlotte exited the garden. +38 Benjamin moved the apple to the green_crate. +39 Benjamin exited the garden. +40 Emily made no movements and stayed in the garden for 1 minute. +41 Emily exited the garden. +42 Emma, Charlotte, Benjamin and Emily entered the waiting_room. +43 Charlotte publicly claimed that apple is in the blue_cupboard. +44 Emma saw a monkey. +45 Emily privately told Benjamin that the apple is in the green_bottle. +Question: Where does Benjamin think Charlotte thinks Emily thinks Mila thinks the persimmon is? +Answer: red_envelope +Choices: A. green_bathtub, B. green_bucket, C. green_box, D. red_pantry, E. red_envelope, F. green_cupboard, G. green_envelope, H. blue_bottle, I. green_treasure_chest, J. blue_container, K. green_bottle, L. green_crate, M. red_crate, N. blue_cupboard, O. red_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: N. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..76ec395c3bcec7cb869b9d6542fa4842174b5aca --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. 
+29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where is the spinach really? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c20aaf7f897ac3210ff57e607608f9b54c2ea608 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. 
+Question: Where does Abigail really think the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1f1e8a7fc41537408dd27df4f77012c4dd50de4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. 
+9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Benjamin think Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4d20169c2d237f7a55a4b20144a74c27c2fe6cb5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. 
+17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. +26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Jack think Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..be32d0fcce4f60c03fcd2c805a79dcede8951464 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Amelia, Jack, Benjamin and Isla entered the sunroom. +2 The spinach is in the green_pantry. +3 Abigail made no movements and stayed in the sunroom for 1 minute. +4 Abigail exited the sunroom. +5 Amelia made no movements and stayed in the sunroom for 1 minute. +6 Amelia exited the sunroom. +7 Jack made no movements and stayed in the sunroom for 1 minute. +8 Jack exited the sunroom. +9 Benjamin made no movements and stayed in the sunroom for 1 minute. +10 Benjamin exited the sunroom. +11 Abigail dislikes the spinach. +12 Isla moved the spinach to the green_pantry. +13 Isla exited the sunroom. +14 Abigail, Amelia, Jack, Benjamin and Isla entered the waiting_room. +15 Jack publicly claimed that spinach is in the green_pantry. +16 Isla privately told Jack that the spinach is in the blue_suitcase. +17 Abigail, Isla and Jack entered the patio. +18 The persimmon is in the blue_bottle. +19 Abigail made no movements and stayed in the patio for 1 minute. +20 Abigail exited the patio. +21 Isla made no movements and stayed in the patio for 1 minute. +22 Isla exited the patio. +23 Jack moved the persimmon to the green_bottle. +24 Jack exited the patio. +25 Abigail, Isla and Jack entered the waiting_room. 
+26 Benjamin, Isla, Amelia and Jack entered the front_yard. +27 The tangerine is in the blue_treasure_chest. +28 Benjamin made no movements and stayed in the front_yard for 1 minute. +29 Benjamin exited the front_yard. +30 Isla made no movements and stayed in the front_yard for 1 minute. +31 Isla exited the front_yard. +32 Amelia moved the tangerine to the green_bucket. +33 Amelia exited the front_yard. +34 Jack moved the tangerine to the blue_cupboard. +35 Jack exited the front_yard. +36 Benjamin, Isla, Amelia and Jack entered the waiting_room. +37 Isla publicly claimed that tangerine is in the green_treasure_chest. +38 Jack privately told Amelia that the tangerine is in the green_bucket. +Question: Where does Amelia think Jack thinks Benjamin thinks Abigail thinks the spinach is? +Answer: green_pantry +Choices: A. green_bottle, B. blue_bottle, C. blue_pantry, D. red_pantry, E. blue_bucket, F. green_pantry, G. green_bathtub, H. blue_container, I. green_basket, J. blue_suitcase, K. green_treasure_chest, L. blue_treasure_chest, M. red_envelope, N. blue_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: N. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4e4725cf0787cdf4bb0678364a637f49654e8a6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. 
+30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where is the spinach really? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: L. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ae3d35ef1d56eb4f37a705e1bf37cc8c8ea76aec --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. 
+30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Avery really think the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: L. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d6f64d65f113fe89108b5b647d3f7078f1ace96 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. 
+30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Hannah think Avery thinks the spinach is? +Answer: red_crate +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_crate +GPT-4 Explain: Hannah thinks Avery thinks the spinach is in the green_pantry. Answer: L. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..278f7d5a3f51eb634a9ffb5c02d389a264f1bb5f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. +30 Isabella moved the cherry to the green_pantry. 
+31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Isabella think Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: M. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c065403bf5427f4973b74291b6b89942a83e3e1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Isabella, Avery, Hannah, Noah and Nathan entered the dining_room. +2 The spinach is in the green_pantry. +3 Isabella made no movements and stayed in the dining_room for 1 minute. +4 Isabella exited the dining_room. +5 Avery moved the spinach to the red_crate. +6 Avery exited the dining_room. +7 Hannah moved the spinach to the green_cupboard. +8 Hannah exited the dining_room. +9 Noah made no movements and stayed in the dining_room for 1 minute. +10 Noah exited the dining_room. +11 Nathan moved the spinach to the green_pantry. +12 Nathan exited the dining_room. +13 Isabella, Avery, Hannah, Noah and Nathan entered the waiting_room. +14 Hannah lost his gloves. +15 Hannah privately told Isabella that the spinach is in the green_cupboard. +16 Avery privately told Noah that the spinach is in the green_pantry. +17 Avery, Noah and Hannah entered the garage. +18 Hannah saw a mouse. +19 The onion is in the red_basket. +20 Avery made no movements and stayed in the garage for 1 minute. +21 Avery exited the garage. +22 Noah made no movements and stayed in the garage for 1 minute. +23 Noah exited the garage. +24 Hannah made no movements and stayed in the garage for 1 minute. +25 Hannah exited the garage. +26 Avery, Noah and Hannah entered the waiting_room. +27 Isabella likes the green_basket. +28 Isabella, Nathan, Noah and Avery entered the dining_room. +29 The cherry is in the red_crate. 
+30 Isabella moved the cherry to the green_pantry. +31 Isabella exited the dining_room. +32 Nathan moved the cherry to the green_box. +33 Nathan exited the dining_room. +34 Noah made no movements and stayed in the dining_room for 1 minute. +35 Noah exited the dining_room. +36 Avery made no movements and stayed in the dining_room for 1 minute. +37 Avery exited the dining_room. +38 Isabella, Nathan, Noah and Avery entered the waiting_room. +39 Isabella publicly claimed that cherry is in the green_pantry. +40 Avery privately told Hannah that the cherry is in the green_box. +Question: Where does Nathan think Isabella thinks Hannah thinks Avery thinks the spinach is? +Answer: green_pantry +Choices: A. red_basket, B. red_container, C. blue_bottle, D. green_basket, E. red_pantry, F. blue_crate, G. green_bathtub, H. blue_pantry, I. blue_container, J. blue_suitcase, K. red_crate, L. green_pantry, M. green_box, N. red_drawer, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: Nathan thinks Isabella thinks Hannah thinks Avery thinks the spinach is in the green_cupboard. Answer: O. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..116ad51c4fba0af4b27a4a03a2f98cd62ec52ced --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. 
+31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where is the onion really? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1e8f587364bf86c2f51061eca7fd955b47def50 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. 
+Question: Where does Mila really think the onion is? +Answer: red_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..09b92b939f6bfd6659f74ce7fb3be0b7c5fbcec5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. 
+10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Abigail think Mila thinks the onion is? +Answer: red_bucket +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d14caea00493bf7d6c792ff72070f9f5b86b51c5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. 
+18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. +27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Jack think Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2868991d3298d6de30458e3c1e46dd8bea848e77 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Mila saw a cat. +2 Jack, Abigail, Emily, Lily and Mila entered the master_bedroom. +3 Emily lost his watch. +4 The onion is in the green_crate. +5 Jack made no movements and stayed in the master_bedroom for 1 minute. +6 Jack exited the master_bedroom. +7 Abigail made no movements and stayed in the master_bedroom for 1 minute. +8 Abigail exited the master_bedroom. +9 Emily made no movements and stayed in the master_bedroom for 1 minute. +10 Emily exited the master_bedroom. +11 Lily moved the onion to the blue_bucket. +12 Lily exited the master_bedroom. +13 Mila made no movements and stayed in the master_bedroom for 1 minute. +14 Mila exited the master_bedroom. +15 Jack, Abigail, Emily, Lily and Mila entered the waiting_room. +16 Lily publicly claimed that onion is in the blue_bucket. +17 Mila privately told Jack that the onion is in the blue_bucket. +18 Mila, Abigail and Emily entered the porch. +19 The pear is in the red_bottle. +20 Mila moved the pear to the green_pantry. +21 Mila exited the porch. +22 Abigail moved the pear to the green_basket. +23 Abigail exited the porch. +24 Emily made no movements and stayed in the porch for 1 minute. +25 Emily exited the porch. +26 Mila, Abigail and Emily entered the waiting_room. 
+27 Abigail, Lily, Mila and Emily entered the master_bedroom. +28 The onion is in the blue_bucket. +29 Abigail moved the onion to the red_bucket. +30 Abigail exited the master_bedroom. +31 Lily made no movements and stayed in the master_bedroom for 1 minute. +32 Lily exited the master_bedroom. +33 Mila made no movements and stayed in the master_bedroom for 1 minute. +34 Mila exited the master_bedroom. +35 Emily moved the onion to the green_crate. +36 Emily exited the master_bedroom. +37 Abigail, Lily, Mila and Emily entered the waiting_room. +38 Lily privately told Mila that the onion is in the green_crate. +39 Emily privately told Jack that the onion is in the green_crate. +Question: Where does Emily think Jack thinks Abigail thinks Mila thinks the onion is? +Answer: green_crate +Choices: A. blue_bottle, B. green_crate, C. red_bucket, D. blue_bucket, E. red_box, F. red_bottle, G. red_envelope, H. green_bucket, I. green_pantry, J. green_basket, K. blue_pantry, L. green_cupboard, M. blue_drawer, N. red_basket, O. green_drawer + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: D. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5c46834da00fa5863c31a87b8c9988b4f723e6a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. 
+32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where is the carrot really? +Answer: green_crate +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..be38793c16cca0ab16d4c3fd4eb676c75c6a0ed2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. 
+Question: Where does Abigail really think the carrot is? +Answer: red_drawer +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_drawer +GPT-4 Explain: L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..16d3604cdfa41016184b0da8fcc1391d0f888de1 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. 
+10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Nathan think Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a14f866877bc1a7aa4323d5f76e323a634e42ed --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. 
+19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. +28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Avery think Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..15f1d0db9f4102d11c9fb185740b8b0415560ccb --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Emma, Avery, Isabella and Abigail entered the front_yard. +2 Abigail saw a mouse. +3 The carrot is in the red_envelope. +4 Nathan made no movements and stayed in the front_yard for 1 minute. +5 Nathan exited the front_yard. +6 Avery saw a dog. +7 Emma made no movements and stayed in the front_yard for 1 minute. +8 Emma exited the front_yard. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Isabella moved the carrot to the red_container. +12 Isabella exited the front_yard. +13 Abigail moved the carrot to the red_envelope. +14 Abigail exited the front_yard. +15 Nathan, Emma, Avery, Isabella and Abigail entered the waiting_room. +16 Isabella publicly claimed that carrot is in the red_envelope. +17 Abigail privately told Nathan that the carrot is in the red_envelope. +18 Emma, Avery and Abigail entered the lounge. +19 Nathan saw a cat. +20 The eggplant is in the blue_drawer. +21 Emma made no movements and stayed in the lounge for 1 minute. +22 Emma exited the lounge. +23 Avery moved the eggplant to the blue_pantry. +24 Avery exited the lounge. +25 Abigail moved the eggplant to the green_basket. +26 Abigail exited the lounge. +27 Emma, Avery and Abigail entered the waiting_room. 
+28 Emma, Abigail, Avery and Isabella entered the front_yard. +29 The carrot is in the red_envelope. +30 Emma moved the carrot to the red_drawer. +31 Emma exited the front_yard. +32 Abigail made no movements and stayed in the front_yard for 1 minute. +33 Abigail exited the front_yard. +34 Avery made no movements and stayed in the front_yard for 1 minute. +35 Avery exited the front_yard. +36 Isabella moved the carrot to the green_crate. +37 Isabella exited the front_yard. +38 Emma, Abigail, Avery and Isabella entered the waiting_room. +39 Emma publicly claimed that carrot is in the red_container. +40 Isabella privately told Nathan that the carrot is in the green_crate. +Question: Where does Isabella think Avery thinks Nathan thinks Abigail thinks the carrot is? +Answer: red_envelope +Choices: A. blue_suitcase, B. red_bottle, C. red_basket, D. blue_cupboard, E. blue_treasure_chest, F. blue_drawer, G. blue_crate, H. green_envelope, I. blue_pantry, J. green_basket, K. red_drawer, L. red_envelope, M. green_crate, N. red_pantry, O. red_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: J. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b97e9d2791fd82c6257ffb2e71fc6ac76595a9e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. 
+32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where is the peach really? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bdcf38c75729d11fa84e551fb18b344aa91fa51 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. 
+Question: Where does Abigail really think the peach is? +Answer: red_pantry +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f56a432358457dd5eacf8a9cd33f3d77db52456a --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. 
+10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Sophia think Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..824b630b0d6c9db77f871234a657f1648dccbb90 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. 
+17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. +27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Aiden think Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f8b85fbdacdf118ade5d81523c945fc6ca27c5b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Abigail, Aiden, Benjamin, Sophia and Isla entered the hallway. +2 The peach is in the red_bucket. +3 Aiden likes the red_crate. +4 Abigail made no movements and stayed in the hallway for 1 minute. +5 Abigail exited the hallway. +6 Aiden moved the peach to the red_pantry. +7 Aiden exited the hallway. +8 Benjamin made no movements and stayed in the hallway for 1 minute. +9 Benjamin exited the hallway. +10 Sophia made no movements and stayed in the hallway for 1 minute. +11 Sophia exited the hallway. +12 Isla moved the peach to the red_bucket. +13 Isla exited the hallway. +14 Abigail, Aiden, Benjamin, Sophia and Isla entered the waiting_room. +15 Benjamin privately told Abigail that the peach is in the red_pantry. +16 Aiden privately told Sophia that the peach is in the red_envelope. +17 Benjamin, Isla and Abigail entered the hallway. +18 The peach is in the red_bucket. +19 Benjamin moved the peach to the red_crate. +20 Benjamin exited the hallway. +21 Isla made no movements and stayed in the hallway for 1 minute. +22 Isla exited the hallway. +23 Benjamin dislikes the watermelon. +24 Abigail moved the peach to the red_pantry. +25 Abigail exited the hallway. +26 Benjamin, Isla and Abigail entered the waiting_room. 
+27 Isla, Aiden, Abigail and Benjamin entered the hallway. +28 The plum is in the red_envelope. +29 Isla dislikes the tangerine. +30 Isla moved the plum to the red_pantry. +31 Isla exited the hallway. +32 Aiden made no movements and stayed in the hallway for 1 minute. +33 Abigail saw a monkey. +34 Aiden exited the hallway. +35 Abigail moved the plum to the green_cupboard. +36 Abigail exited the hallway. +37 Benjamin made no movements and stayed in the hallway for 1 minute. +38 Benjamin exited the hallway. +39 Isla, Aiden, Abigail and Benjamin entered the waiting_room. +40 Isla publicly claimed that plum is in the red_bucket. +41 Benjamin privately told Sophia that the plum is in the green_cupboard. +Question: Where does Isla think Aiden thinks Sophia thinks Abigail thinks the peach is? +Answer: red_bucket +Choices: A. red_container, B. blue_crate, C. green_crate, D. blue_pantry, E. green_treasure_chest, F. blue_cupboard, G. green_bottle, H. blue_suitcase, I. green_box, J. blue_bucket, K. red_envelope, L. red_bucket, M. red_crate, N. red_pantry, O. green_cupboard + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: Isla thinks Aiden thinks Sophia thinks Abigail thinks the peach is in the red_pantry. Answer: N. 
\ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..74bf44c7f506a9ad21797204918f436b56cd60cf --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. 
+32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where is the cherry really? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: K. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b8574351ea4ac44b394f58699f0ccbe8abdfde6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. 
+Question: Where does Aiden really think the cherry is? +Answer: blue_cupboard +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ccb9619b8b85585dfd2d9acc25198deed5d21e02 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. 
+11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Noah think Aiden thinks the cherry is? +Answer: green_envelope +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: K. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..11a7f14f830b89d869fed34a5203114b7c0ff4f5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. 
+20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. +30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Owen think Noah thinks Aiden thinks the cherry is? +Answer: blue_bucket +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_bucket +GPT-4 Explain: J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e1ed291f24251d31e1d45ad423121bb49dd833c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Aiden saw a cat. +2 Owen, Avery, Noah, Aiden and Ella entered the front_yard. +3 The cherry is in the green_envelope. +4 Noah likes the green_envelope. +5 Owen moved the cherry to the blue_bucket. +6 Owen exited the front_yard. +7 Avery lost his phone. +8 Avery made no movements and stayed in the front_yard for 1 minute. +9 Avery exited the front_yard. +10 Noah made no movements and stayed in the front_yard for 1 minute. +11 Noah exited the front_yard. +12 Aiden moved the cherry to the blue_cupboard. +13 Aiden exited the front_yard. +14 Ella made no movements and stayed in the front_yard for 1 minute. +15 Ella exited the front_yard. +16 Owen, Avery, Noah, Aiden and Ella entered the waiting_room. +17 Noah publicly claimed that cherry is in the green_envelope. +18 Ella privately told Noah that the cherry is in the blue_bottle. +19 Aiden, Avery and Owen entered the bedroom. +20 The lettuce is in the green_box. +21 Aiden made no movements and stayed in the bedroom for 1 minute. +22 Aiden exited the bedroom. +23 Avery moved the lettuce to the red_envelope. +24 Avery exited the bedroom. +25 Owen made no movements and stayed in the bedroom for 1 minute. +26 Owen exited the bedroom. +27 Aiden, Avery and Owen entered the waiting_room. +28 Owen, Ella, Aiden and Avery entered the bedroom. +29 The lettuce is in the red_envelope. 
+30 Owen made no movements and stayed in the bedroom for 1 minute. +31 Owen exited the bedroom. +32 Ella made no movements and stayed in the bedroom for 1 minute. +33 Ella exited the bedroom. +34 Aiden made no movements and stayed in the bedroom for 1 minute. +35 Aiden exited the bedroom. +36 Avery moved the lettuce to the blue_treasure_chest. +37 Avery exited the bedroom. +38 Owen, Ella, Aiden and Avery entered the waiting_room. +39 Ella privately told Aiden that the lettuce is in the red_box. +40 Avery privately told Noah that the lettuce is in the blue_treasure_chest. +Question: Where does Ella think Owen thinks Noah thinks Aiden thinks the cherry is? +Answer: blue_bucket +Choices: A. blue_container, B. green_crate, C. green_bottle, D. green_basket, E. red_crate, F. green_envelope, G. blue_bottle, H. red_container, I. blue_bucket, J. blue_cupboard, K. red_envelope, L. green_box, M. red_box, N. green_drawer, O. blue_treasure_chest + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: K. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..41d33c0f7e82c31f27bddaa8a987e4720b3bae50 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. 
+31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where is the turnip really? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: N. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..72106f18b5f41f2ceb58e9df987dd7b63b8ab72d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. 
Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. 
+Question: Where does William really think the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: N. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..11e8bc27a0efe059cf25534aba5c3dd4615109e9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. 
+10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Benjamin think William thinks the turnip is? +Answer: red_bottle +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bottle +GPT-4 Explain: N. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f42e8ed65ec9ec2e7c861b2c573c7b2bda1a753 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. 
+20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. +31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Sophia think Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: green_crate +GPT-4 Explain: N. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..23b726d95db8a2b7e41e0da52fd9562dd091af35 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Liam, William, Hannah and Benjamin entered the porch. +2 The turnip is in the green_crate. +3 Sophia made no movements and stayed in the porch for 1 minute. +4 Sophia exited the porch. +5 Liam moved the turnip to the blue_pantry. +6 Liam exited the porch. +7 William moved the turnip to the red_bottle. +8 William exited the porch. +9 Hannah made no movements and stayed in the porch for 1 minute. +10 Hannah exited the porch. +11 William saw a monkey. +12 Benjamin made no movements and stayed in the porch for 1 minute. +13 Benjamin exited the porch. +14 Sophia, Liam, William, Hannah and Benjamin entered the waiting_room. +15 Sophia saw a mouse. +16 William privately told Sophia that the turnip is in the red_bottle. +17 Liam privately told Hannah that the turnip is in the green_crate. +18 Sophia, Benjamin and Hannah entered the porch. +19 The turnip is in the red_bottle. +20 Sophia moved the turnip to the green_basket. +21 Sophia exited the porch. +22 Benjamin moved the turnip to the green_crate. +23 Benjamin exited the porch. +24 Hannah made no movements and stayed in the porch for 1 minute. +25 Hannah exited the porch. +26 Sophia, Benjamin and Hannah entered the waiting_room. +27 William, Sophia, Liam and Hannah entered the attic. +28 The tomato is in the green_bottle. +29 William moved the tomato to the red_basket. +30 William exited the attic. 
+31 Sophia made no movements and stayed in the attic for 1 minute. +32 Sophia exited the attic. +33 Liam made no movements and stayed in the attic for 1 minute. +34 Liam exited the attic. +35 Hannah moved the tomato to the green_envelope. +36 William saw a mouse. +37 Hannah exited the attic. +38 William, Sophia, Liam and Hannah entered the waiting_room. +39 Sophia saw a dog. +40 Liam publicly claimed that tomato is in the green_bucket. +41 William privately told Hannah that the tomato is in the red_basket. +Question: Where does Liam think Sophia thinks Benjamin thinks William thinks the turnip is? +Answer: green_crate +Choices: A. green_basket, B. green_crate, C. blue_pantry, D. red_bottle, E. red_container, F. blue_crate, G. blue_treasure_chest, H. green_treasure_chest, I. red_drawer, J. green_pantry, K. green_bottle, L. blue_cupboard, M. green_bucket, N. red_basket, O. green_envelope + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: N. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..167f2360adc515ee95f5aba280901dc654fc9b91 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. 
+29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where is the cabbage really? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: G. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f78495bc8dd59af2cdb76e9598194901348893b5 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. 
+Question: Where does Carter really think the cabbage is? +Answer: green_crate +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: I. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d8e437ea335fe13236d777df06e6fd8251b4be9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. 
+9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Avery think Carter thinks the cabbage is? +Answer: green_treasure_chest +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_treasure_chest +GPT-4 Explain: H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d6d560f99e63ac62e8152f3cff91a82c69a1047 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. 
+16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. +25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does Aiden think Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: F. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5ffa091bd82375b36bdbf2fcb399c8765118cd9c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Aiden, Carter, William and Charlotte entered the office. +2 The cabbage is in the green_bucket. +3 Avery made no movements and stayed in the office for 1 minute. +4 Avery exited the office. +5 Aiden made no movements and stayed in the office for 1 minute. +6 Aiden exited the office. +7 Carter made no movements and stayed in the office for 1 minute. +8 Carter exited the office. +9 William made no movements and stayed in the office for 1 minute. +10 William exited the office. +11 Charlotte made no movements and stayed in the office for 1 minute. +12 Charlotte exited the office. +13 Avery, Aiden, Carter, William and Charlotte entered the waiting_room. +14 William publicly claimed that cabbage is in the green_envelope. +15 Charlotte privately told Avery that the cabbage is in the green_bucket. +16 Carter, Charlotte and Avery entered the office. +17 The spinach is in the green_crate. +18 Carter moved the spinach to the green_treasure_chest. +19 Carter exited the office. +20 Charlotte moved the spinach to the green_bucket. +21 Charlotte exited the office. +22 Avery made no movements and stayed in the office for 1 minute. +23 Avery exited the office. +24 Carter, Charlotte and Avery entered the waiting_room. 
+25 Aiden, Charlotte, Avery and William entered the office. +26 The cabbage is in the green_bucket. +27 Aiden made no movements and stayed in the office for 1 minute. +28 Aiden exited the office. +29 Charlotte made no movements and stayed in the office for 1 minute. +30 Charlotte exited the office. +31 William lost his phone. +32 Avery moved the cabbage to the green_crate. +33 Avery exited the office. +34 William made no movements and stayed in the office for 1 minute. +35 William exited the office. +36 Aiden, Charlotte, Avery and William entered the waiting_room. +37 Aiden publicly claimed that cabbage is in the green_basket. +38 William privately told Carter that the cabbage is in the green_crate. +Question: Where does William think Aiden thinks Avery thinks Carter thinks the cabbage is? +Answer: green_bucket +Choices: A. blue_crate, B. blue_cupboard, C. green_bottle, D. red_pantry, E. green_box, F. green_bucket, G. green_crate, H. green_basket, I. green_treasure_chest, J. green_envelope, K. blue_drawer, L. green_bathtub, M. red_container, N. green_pantry, O. red_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bucket +GPT-4 Explain: H. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0153da62be09f521175482ed22f845070c0c2926 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. 
+31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where is the cherry really? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9195fe960a8afe8ae58e5114a9dd93d98f1a8867 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does William really think the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. 
red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..29aad6910b0b78813331c8e38a79ac6357bd0f50 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. 
+13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Ava think William thinks the cherry is? +Answer: green_basket +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_basket +GPT-4 Explain: N. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1df6f0cee4e02d564be57f2bd5932b91e2b1ca9e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. 
+24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. +31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Logan think Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d993f5cae12424167c0ef2176d39a8f8d95ec8c4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Ava, William, Logan and Amelia entered the cellar. +2 The cherry is in the blue_container. +3 Avery made no movements and stayed in the cellar for 1 minute. +4 Avery exited the cellar. +5 Ava made no movements and stayed in the cellar for 1 minute. +6 Ava exited the cellar. +7 William made no movements and stayed in the cellar for 1 minute. +8 Ava dislikes the beans. +9 William exited the cellar. +10 Logan moved the cherry to the green_bucket. +11 Logan exited the cellar. +12 William likes the green_bucket. +13 Amelia made no movements and stayed in the cellar for 1 minute. +14 Amelia exited the cellar. +15 Avery, Ava, William, Logan and Amelia entered the waiting_room. +16 William publicly claimed that cherry is in the blue_container. +17 Amelia privately told William that the cherry is in the green_pantry. +18 Logan, Amelia and William entered the cellar. +19 The cherry is in the green_bucket. +20 Logan moved the cherry to the green_pantry. +21 Logan exited the cellar. +22 Amelia moved the cherry to the green_basket. +23 Amelia exited the cellar. +24 William made no movements and stayed in the cellar for 1 minute. +25 William exited the cellar. +26 Logan, Amelia and William entered the waiting_room. +27 Logan, Avery, Ava and Amelia entered the cellar. +28 The cherry is in the green_basket. +29 Logan made no movements and stayed in the cellar for 1 minute. +30 Logan exited the cellar. 
+31 Avery made no movements and stayed in the cellar for 1 minute. +32 Avery exited the cellar. +33 Ava moved the cherry to the green_bucket. +34 Ava exited the cellar. +35 Amelia moved the cherry to the blue_container. +36 Amelia exited the cellar. +37 Logan, Avery, Ava and Amelia entered the waiting_room. +38 Ava publicly claimed that cherry is in the green_basket. +39 Logan privately told Amelia that the cherry is in the blue_container. +Question: Where does Amelia think Logan thinks Ava thinks William thinks the cherry is? +Answer: blue_container +Choices: A. green_envelope, B. blue_bathtub, C. red_pantry, D. red_crate, E. green_crate, F. red_basket, G. blue_treasure_chest, H. green_box, I. blue_cupboard, J. red_bottle, K. green_pantry, L. blue_container, M. red_bucket, N. green_basket, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: N. green_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7afcd331e3affaa11d430c8804084cb4acf564e6 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where is the melon really? 
+Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: N. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..93c5b84b066ab268e0b84a07f86ef389ba8fc37c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. 
+12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Aiden really think the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4360f293126a5a6f1527dd117daac6a8ff042901 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. 
+20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Owen think Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. 
+Correct answer: blue_suitcase +GPT-4 Explain: D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a75e5fa3fe221b75bdfa2fc3c2c66cf31889e5d3 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. 
+31 Ella exited the front_yard. +32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Ella think Owen thinks Aiden thinks the melon is? +Answer: blue_suitcase +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_suitcase +GPT-4 Explain: N. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dbff708f45530df1a3a2ea8187af1511290ee52 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Owen dislikes the pear. +2 Ella, Owen, Isla, Aiden and Evelyn entered the back_yard. +3 The melon is in the blue_treasure_chest. +4 Ella likes the blue_suitcase. +5 Ella moved the melon to the blue_bottle. +6 Ella exited the back_yard. +7 Owen moved the melon to the green_envelope. +8 Owen exited the back_yard. +9 Isla made no movements and stayed in the back_yard for 1 minute. +10 Isla exited the back_yard. +11 Aiden moved the melon to the blue_suitcase. +12 Aiden exited the back_yard. +13 Evelyn made no movements and stayed in the back_yard for 1 minute. +14 Evelyn exited the back_yard. +15 Ella, Owen, Isla, Aiden and Evelyn entered the waiting_room. +16 Isla privately told Ella that the melon is in the green_treasure_chest. +17 Owen privately told Aiden that the melon is in the blue_suitcase. +18 Owen, Aiden and Ella entered the back_yard. +19 The lemon is in the green_treasure_chest. +20 Owen moved the lemon to the blue_treasure_chest. +21 Owen exited the back_yard. +22 Owen dislikes the pear. +23 Aiden moved the lemon to the blue_suitcase. +24 Aiden exited the back_yard. +25 Ella made no movements and stayed in the back_yard for 1 minute. +26 Ella exited the back_yard. +27 Owen, Aiden and Ella entered the waiting_room. +28 Ella, Isla, Owen and Aiden entered the front_yard. +29 The banana is in the green_pantry. +30 Ella moved the banana to the green_basket. +31 Ella exited the front_yard. 
+32 Isla moved the banana to the blue_bathtub. +33 Isla exited the front_yard. +34 Owen made no movements and stayed in the front_yard for 1 minute. +35 Owen exited the front_yard. +36 Aiden moved the banana to the green_cupboard. +37 Aiden exited the front_yard. +38 Aiden lost his watch. +39 Ella, Isla, Owen and Aiden entered the waiting_room. +40 Ella publicly claimed that banana is in the green_basket. +41 Aiden privately told Evelyn that the banana is in the green_cupboard. +Question: Where does Evelyn think Ella thinks Owen thinks Aiden thinks the melon is? +Answer: blue_treasure_chest +Choices: A. blue_treasure_chest, B. green_treasure_chest, C. blue_bottle, D. blue_suitcase, E. green_envelope, F. blue_drawer, G. blue_bucket, H. green_box, I. red_envelope, J. red_box, K. green_pantry, L. blue_bathtub, M. green_basket, N. green_cupboard, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_treasure_chest +GPT-4 Explain: N. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..57dfe826c8585e7eab65a31a5860cc60589cc103 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. 
+31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where is the turnip really? +Answer: red_envelope +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: I. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa0e9f3f313783328bfb78302073f3da50f55a2c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Owen really think the turnip is? +Answer: blue_pantry +Choices: A. blue_bottle, B. green_bucket, C. 
blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_pantry +GPT-4 Explain: I. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d14ada0b3124d3f66a550486bd8027edc896ed6b --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. 
+13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Mila think Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..732281344da0fdebbbc0192038741a6c02482667 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. 
+23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. +31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Carter think Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: H. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..1724f4c301e1806efb491d7bcae4bce7a954e9f9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Carter, Mila, Owen, Avery and Isla entered the sunroom. +2 The turnip is in the green_pantry. +3 Carter made no movements and stayed in the sunroom for 1 minute. +4 Carter exited the sunroom. +5 Mila made no movements and stayed in the sunroom for 1 minute. +6 Mila exited the sunroom. +7 Owen moved the turnip to the blue_cupboard. +8 Owen exited the sunroom. +9 Avery moved the turnip to the red_envelope. +10 Avery exited the sunroom. +11 Isla made no movements and stayed in the sunroom for 1 minute. +12 Isla exited the sunroom. +13 Carter, Mila, Owen, Avery and Isla entered the waiting_room. +14 Avery publicly claimed that turnip is in the blue_pantry. +15 Isla privately told Carter that the turnip is in the red_envelope. +16 Isla, Avery and Carter entered the back_yard. +17 The persimmon is in the red_basket. +18 Isla made no movements and stayed in the back_yard for 1 minute. +19 Isla exited the back_yard. +20 Avery made no movements and stayed in the back_yard for 1 minute. +21 Avery exited the back_yard. +22 Carter moved the persimmon to the red_box. +23 Carter exited the back_yard. +24 Isla, Avery and Carter entered the waiting_room. +25 Avery, Isla, Carter and Owen entered the back_yard. +26 Isla lost his watch. +27 The grapes is in the red_box. +28 Avery moved the grapes to the green_box. +29 Avery exited the back_yard. +30 Isla made no movements and stayed in the back_yard for 1 minute. 
+31 Isla exited the back_yard. +32 Carter made no movements and stayed in the back_yard for 1 minute. +33 Carter exited the back_yard. +34 Owen made no movements and stayed in the back_yard for 1 minute. +35 Owen exited the back_yard. +36 Avery, Isla, Carter and Owen entered the waiting_room. +37 Carter publicly claimed that grapes is in the blue_bucket. +38 Avery saw a dog. +39 Avery privately told Owen that the grapes is in the red_basket. +Question: Where does Isla think Carter thinks Mila thinks Owen thinks the turnip is? +Answer: green_pantry +Choices: A. blue_bottle, B. green_bucket, C. blue_bathtub, D. red_bottle, E. blue_treasure_chest, F. green_pantry, G. red_drawer, H. blue_pantry, I. red_envelope, J. blue_cupboard, K. red_basket, L. red_box, M. green_box, N. green_crate, O. blue_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_pantry +GPT-4 Explain: H. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e597e00da2cbf9995e91cc5ae3ec90e3c100142c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where is the spinach really? 
+Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: O. green_crate \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7fcc13fb42fc35a106de2624543af2fec700a911 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. 
+12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jacob really think the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4710f1a6ed03a70123fca819a72c975e7766029 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. 
+20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jackson think Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: M. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8299f15a7baadf509807bb50aa3c867c2c1e9fcd --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. 
+33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. +Question: Where does Jack think Jackson thinks Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ca1dabbef0a86e43c81f80be6a7d28d1c6a615d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Ella saw a mouse. +2 Jackson, Jack, Ella, Jacob and Amelia entered the laundry. +3 The spinach is in the red_container. +4 Jackson moved the spinach to the green_crate. +5 Jackson exited the laundry. +6 Jack moved the spinach to the blue_drawer. +7 Jack exited the laundry. +8 Ella moved the spinach to the red_drawer. +9 Ella exited the laundry. +10 Jacob made no movements and stayed in the laundry for 1 minute. +11 Jacob exited the laundry. +12 Amelia made no movements and stayed in the laundry for 1 minute. +13 Amelia exited the laundry. +14 Jackson, Jack, Ella, Jacob and Amelia entered the waiting_room. +15 Ella privately told Jackson that the spinach is in the red_crate. +16 Jack privately told Jacob that the spinach is in the red_drawer. +17 Jackson, Jacob and Ella entered the laundry. +18 The spinach is in the red_drawer. +19 Jackson moved the spinach to the green_crate. +20 Jackson exited the laundry. +21 Jacob made no movements and stayed in the laundry for 1 minute. +22 Jacob exited the laundry. +23 Amelia dislikes the tomato. +24 Ella made no movements and stayed in the laundry for 1 minute. +25 Ella exited the laundry. +26 Amelia likes the red_crate. +27 Jackson, Jacob and Ella entered the waiting_room. +28 Jacob likes the red_pantry. +29 Amelia, Jacob, Ella and Jack entered the patio. +30 The tomato is in the green_drawer. +31 Amelia moved the tomato to the green_bottle. +32 Amelia exited the patio. +33 Jacob made no movements and stayed in the patio for 1 minute. +34 Jacob exited the patio. +35 Ella moved the tomato to the green_bucket. +36 Ella exited the patio. +37 Jack made no movements and stayed in the patio for 1 minute. +38 Jack exited the patio. +39 Amelia, Jacob, Ella and Jack entered the waiting_room. +40 Amelia publicly claimed that tomato is in the green_box. +41 Jack privately told Jackson that the tomato is in the green_bucket. 
+Question: Where does Ella think Jack thinks Jackson thinks Jacob thinks the spinach is? +Answer: green_crate +Choices: A. green_bottle, B. green_drawer, C. green_box, D. green_bucket, E. blue_crate, F. green_bathtub, G. blue_suitcase, H. red_pantry, I. blue_bucket, J. blue_bathtub, K. red_container, L. blue_drawer, M. red_drawer, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_crate +GPT-4 Explain: M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c55a9d259bf7154995e863e4d7bae162eb6a216 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. 
+11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where is the corn really? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: G. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a918f3fdb9d583d0ecbb92a8f1c26d5b6f75633 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. 
+21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Amelia really think the corn is? +Answer: green_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: G. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f58bfeb97d4e13b8b1b185a7a65815baa19e911 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. 
+31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Nathan think Amelia thinks the corn is? +Answer: green_bottle +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: J. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2eee5c12670639ca3bfb3c129aaf802397f0ae4 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. +14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Lily think Nathan thinks Amelia thinks the corn is? +Answer: red_envelope +Choices: A. green_basket, B. red_container, C. 
red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: I. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..dd28f00234ef69125a3d8e69cbf86795d3ce391d --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1,47 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Lily, Amelia, Alexander and Abigail entered the hallway. +2 The corn is in the green_bottle. +3 Nathan moved the corn to the red_envelope. +4 Abigail saw a cat. +5 Nathan exited the hallway. +6 Lily moved the corn to the green_envelope. +7 Lily exited the hallway. +8 Amelia moved the corn to the green_drawer. +9 Amelia exited the hallway. +10 Alexander moved the corn to the green_box. +11 Alexander exited the hallway. +12 Abigail moved the corn to the green_bottle. +13 Abigail exited the hallway. 
+14 Nathan, Lily, Amelia, Alexander and Abigail entered the waiting_room. +15 Amelia publicly claimed that corn is in the green_bottle. +16 Abigail privately told Amelia that the corn is in the green_envelope. +17 Nathan, Abigail and Amelia entered the lounge. +18 The tangerine is in the red_drawer. +19 Nathan moved the tangerine to the blue_pantry. +20 Nathan exited the lounge. +21 Abigail moved the tangerine to the green_treasure_chest. +22 Abigail exited the lounge. +23 Amelia made no movements and stayed in the lounge for 1 minute. +24 Amelia exited the lounge. +25 Nathan, Abigail and Amelia entered the waiting_room. +26 Amelia, Alexander, Lily and Nathan entered the bedroom. +27 The green_pepper is in the green_basket. +28 Amelia moved the green_pepper to the green_cupboard. +29 Amelia exited the bedroom. +30 Alexander made no movements and stayed in the bedroom for 1 minute. +31 Alexander exited the bedroom. +32 Lily moved the green_pepper to the red_container. +33 Lily exited the bedroom. +34 Nathan made no movements and stayed in the bedroom for 1 minute. +35 Nathan exited the bedroom. +36 Amelia, Alexander, Lily and Nathan entered the waiting_room. +37 Lily publicly claimed that green_pepper is in the green_basket. +38 Amelia privately told Nathan that the green_pepper is in the green_cupboard. +Question: Where does Alexander think Lily thinks Nathan thinks Amelia thinks the corn is? +Answer: red_envelope +Choices: A. green_basket, B. red_container, C. red_bottle, D. green_cupboard, E. blue_bucket, F. green_bottle, G. green_envelope, H. green_box, I. red_envelope, J. green_drawer, K. red_drawer, L. blue_container, M. blue_bottle, N. green_treasure_chest, O. blue_pantry + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. 
(3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: J. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..92c01ef1b21bbdf18cc53fb29a3a135ffb106766 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. 
+22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where is the sweet_potato really? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: J. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a7a4f30d67f3e37845168ba7ccb724dd5d3723b2 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. 
+31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Sophia really think the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3c92cbc3db264a895e18a29892459a3781ac2f47 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. 
+Question: Where does Jackson think Sophia thinks the sweet_potato is? +Answer: red_box +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_box +GPT-4 Explain: N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8046baef4934fb6118360c839f646a05cec23d2c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. 
+10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. +19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Avery think Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf87aa5903101568d833e932033169794cc6c1df --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1,49 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Sophia, Noah, Avery, Hannah and Jackson entered the front_yard. +2 The sweet_potato is in the red_box. +3 Sophia moved the sweet_potato to the green_bottle. +4 Sophia exited the front_yard. +5 Noah made no movements and stayed in the front_yard for 1 minute. +6 Noah dislikes the melon. +7 Noah exited the front_yard. +8 Avery likes the green_pantry. +9 Avery made no movements and stayed in the front_yard for 1 minute. +10 Avery exited the front_yard. +11 Hannah moved the sweet_potato to the green_box. +12 Hannah exited the front_yard. +13 Jackson moved the sweet_potato to the red_box. +14 Jackson exited the front_yard. +15 Sophia, Noah, Avery, Hannah and Jackson entered the waiting_room. +16 Hannah publicly claimed that sweet_potato is in the green_bottle. +17 Jackson privately told Sophia that the sweet_potato is in the red_box. +18 Hannah, Jackson and Sophia entered the front_yard. 
+19 The orange is in the green_envelope. +20 Hannah made no movements and stayed in the front_yard for 1 minute. +21 Hannah exited the front_yard. +22 Jackson moved the orange to the red_box. +23 Jackson exited the front_yard. +24 Sophia moved the orange to the blue_bucket. +25 Sophia exited the front_yard. +26 Hannah, Jackson and Sophia entered the waiting_room. +27 Noah, Jackson, Avery and Hannah entered the basement. +28 The peach is in the green_bucket. +29 Noah moved the peach to the red_envelope. +30 Noah exited the basement. +31 Jackson moved the peach to the red_container. +32 Jackson exited the basement. +33 Avery made no movements and stayed in the basement for 1 minute. +34 Avery exited the basement. +35 Hannah moved the peach to the red_basket. +36 Hannah exited the basement. +37 Hannah likes the blue_bottle. +38 Noah, Jackson, Avery and Hannah entered the waiting_room. +39 Jackson publicly claimed that peach is in the red_container. +40 Hannah privately told Avery that the peach is in the red_basket. +Question: Where does Hannah think Avery thinks Jackson thinks Sophia thinks the sweet_potato is? +Answer: green_bottle +Choices: A. blue_container, B. green_pantry, C. blue_bottle, D. blue_drawer, E. red_pantry, F. green_drawer, G. green_bucket, H. red_basket, I. red_envelope, J. red_container, K. red_box, L. green_envelope, M. blue_bucket, N. green_bottle, O. green_box + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: H. red_basket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9ded5f63da563952642e2d975eb34087e140356 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. 
+27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. +30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where is the orange really? +Answer: blue_bucket +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bucket +GPT-4 Explain: C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f85eccc4b011303f3a60d617ffa6f15f16647cc --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. 
+30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Owen really think the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef30d7f08cfbff7c20632ae72041c64e9981254c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. 
+30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Isabella think Owen thinks the orange is? +Answer: red_container +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_container +GPT-4 Explain: C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..29665b67db180a77fa9038f8c8ce1cad476c9221 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. 
+30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Jacob think Isabella thinks Owen thinks the orange is? +Answer: blue_bottle +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..71105c020977e0a59d8d3b34ab5651b40dd0261e --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Hannah, Jacob, Jackson, Isabella and Owen entered the laundry. +2 The orange is in the green_box. +3 Hannah made no movements and stayed in the laundry for 1 minute. +4 Hannah exited the laundry. +5 Hannah saw a monkey. +6 Jacob moved the orange to the blue_bottle. +7 Jackson saw a dog. +8 Jacob exited the laundry. +9 Jackson moved the orange to the red_container. +10 Jackson exited the laundry. +11 Isabella made no movements and stayed in the laundry for 1 minute. +12 Isabella exited the laundry. +13 Owen made no movements and stayed in the laundry for 1 minute. +14 Owen exited the laundry. +15 Hannah, Jacob, Jackson, Isabella and Owen entered the waiting_room. +16 Isabella publicly claimed that orange is in the blue_bucket. +17 Owen privately told Hannah that the orange is in the red_container. +18 Isabella, Jackson and Owen entered the lounge. +19 The green_pepper is in the green_envelope. +20 Isabella made no movements and stayed in the lounge for 1 minute. +21 Isabella exited the lounge. +22 Jackson made no movements and stayed in the lounge for 1 minute. +23 Jackson exited the lounge. +24 Owen made no movements and stayed in the lounge for 1 minute. +25 Hannah lost his watch. +26 Owen exited the lounge. +27 Isabella, Jackson and Owen entered the waiting_room. +28 Owen, Jackson, Isabella and Hannah entered the laundry. +29 The orange is in the red_container. 
+30 Owen made no movements and stayed in the laundry for 1 minute. +31 Owen exited the laundry. +32 Jackson made no movements and stayed in the laundry for 1 minute. +33 Jackson exited the laundry. +34 Isabella moved the orange to the blue_bucket. +35 Isabella exited the laundry. +36 Hannah made no movements and stayed in the laundry for 1 minute. +37 Jacob saw a dog. +38 Hannah exited the laundry. +39 Isabella lost his watch. +40 Owen, Jackson, Isabella and Hannah entered the waiting_room. +41 Jackson publicly claimed that orange is in the red_container. +42 Owen lost his watch. +43 Hannah privately told Isabella that the orange is in the blue_bottle. +Question: Where does Hannah think Jacob thinks Isabella thinks Owen thinks the orange is? +Answer: green_box +Choices: A. green_box, B. red_container, C. blue_bucket, D. blue_bottle, E. blue_container, F. blue_cupboard, G. blue_treasure_chest, H. blue_suitcase, I. red_bucket, J. blue_crate, K. green_envelope, L. red_crate, M. green_cupboard, N. blue_bathtub, O. green_bucket + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1409bd911f35c09ba31bb38d812923eb77112e77 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. 
+33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where is the lime really? +Answer: green_bottle +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_bottle +GPT-4 Explain: J. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5fae651c9c0ab218f6bcd89856b98c7d040804d8 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Amelia really think the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. 
red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8aa3af15107713c39eae06e65ab162a039b73f7c --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. 
+14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Sophia think Amelia thinks the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. 
What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: I. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1a8d1cc18627e192fdb9c88a0d8c752a9fa97ce7 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. 
+24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. +33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Chloe think Sophia thinks Amelia thinks the lime is? +Answer: green_envelope +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_envelope +GPT-4 Explain: I. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67628309b3399ce90d5d790558423306776eb9ba --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1,50 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Benjamin, Isabella, Chloe, Amelia and Sophia entered the porch. +2 The lime is in the green_bottle. +3 Benjamin moved the lime to the green_treasure_chest. +4 Benjamin exited the porch. +5 Isabella moved the lime to the blue_crate. +6 Isabella exited the porch. +7 Chloe moved the lime to the green_envelope. +8 Chloe exited the porch. +9 Amelia made no movements and stayed in the porch for 1 minute. +10 Amelia exited the porch. +11 Sophia moved the lime to the green_bottle. +12 Chloe lost his phone. +13 Sophia exited the porch. +14 Benjamin, Isabella, Chloe, Amelia and Sophia entered the waiting_room. +15 Amelia publicly claimed that lime is in the green_bottle. +16 Sophia privately told Benjamin that the lime is in the green_bottle. +17 Isabella, Sophia and Amelia entered the laundry. +18 The beans is in the blue_suitcase. +19 Isabella moved the beans to the blue_bottle. +20 Isabella exited the laundry. +21 Sophia made no movements and stayed in the laundry for 1 minute. +22 Sophia exited the laundry. +23 Benjamin dislikes the persimmon. +24 Amelia moved the beans to the red_box. +25 Amelia lost his gloves. +26 Amelia exited the laundry. +27 Isabella, Sophia and Amelia entered the waiting_room. +28 Benjamin, Sophia, Chloe and Amelia entered the laundry. +29 The beans is in the red_box. +30 Benjamin made no movements and stayed in the laundry for 1 minute. +31 Isabella saw a dog. +32 Benjamin exited the laundry. 
+33 Sophia moved the beans to the blue_drawer. +34 Sophia exited the laundry. +35 Chloe moved the beans to the blue_bottle. +36 Chloe exited the laundry. +37 Amelia moved the beans to the green_pantry. +38 Amelia exited the laundry. +39 Benjamin, Sophia, Chloe and Amelia entered the waiting_room. +40 Sophia publicly claimed that beans is in the red_box. +41 Amelia privately told Chloe that the beans is in the green_pantry. +Question: Where does Isabella think Chloe thinks Sophia thinks Amelia thinks the lime is? +Answer: blue_crate +Choices: A. green_bottle, B. blue_crate, C. red_basket, D. green_envelope, E. green_treasure_chest, F. blue_drawer, G. blue_suitcase, H. blue_bottle, I. green_pantry, J. red_box, K. green_drawer, L. blue_bucket, M. blue_cupboard, N. green_crate, O. blue_container + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_crate +GPT-4 Explain: J. red_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..961fa37252fce44067ef164ef3965f2ddcb9c989 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. 
Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. 
+43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where is the carrot really? +Answer: red_pantry +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_pantry +GPT-4 Explain: N. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..43a2860f650ae2cdeec15a0933b3dec7f5e15dd0 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. 
+11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Chloe really think the carrot is? +Answer: green_box +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. 
(1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: green_box +GPT-4 Explain: N. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e3a910a0ff15efc1c6e8b8a2934a3b7a2e50a1f --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. 
+20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Amelia think Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. 
The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: N. green_box \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a7c1e0ee3f912edb1f21d268781d9cd4d54fe20 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. 
+29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. +33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Avery think Amelia thinks Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: M. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a4ded85a05a2f427e218ad677d89e4c9af9e983 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1,52 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Avery, Amelia, Jack, Chloe and Sophia entered the garage. +2 The carrot is in the red_pantry. +3 Avery moved the carrot to the red_bucket. +4 Amelia lost his phone. +5 Avery exited the garage. +6 Amelia made no movements and stayed in the garage for 1 minute. +7 Jack lost his phone. +8 Amelia exited the garage. +9 Jack moved the carrot to the blue_crate. +10 Jack exited the garage. +11 Chloe moved the carrot to the green_box. +12 Chloe exited the garage. +13 Avery dislikes the cherry. +14 Sophia moved the carrot to the red_pantry. +15 Sophia exited the garage. +16 Avery, Amelia, Jack, Chloe and Sophia entered the waiting_room. +17 Amelia saw a cat. +18 Jack publicly claimed that carrot is in the green_treasure_chest. +19 Sophia privately told Jack that the carrot is in the green_box. +20 Chloe, Sophia and Amelia entered the closet. +21 The lettuce is in the red_box. +22 Chloe made no movements and stayed in the closet for 1 minute. +23 Chloe exited the closet. +24 Sophia made no movements and stayed in the closet for 1 minute. +25 Sophia exited the closet. +26 Amelia made no movements and stayed in the closet for 1 minute. +27 Amelia exited the closet. +28 Chloe, Sophia and Amelia entered the waiting_room. +29 Chloe, Sophia, Avery and Jack entered the closet. +30 The watermelon is in the blue_pantry. +31 Chloe made no movements and stayed in the closet for 1 minute. +32 Chloe exited the closet. 
+33 Sophia made no movements and stayed in the closet for 1 minute. +34 Sophia exited the closet. +35 Avery likes the red_pantry. +36 Avery made no movements and stayed in the closet for 1 minute. +37 Avery exited the closet. +38 Jack made no movements and stayed in the closet for 1 minute. +39 Jack exited the closet. +40 Jack dislikes the watermelon. +41 Chloe, Sophia, Avery and Jack entered the waiting_room. +42 Sophia publicly claimed that watermelon is in the red_envelope. +43 Jack privately told Avery that the watermelon is in the blue_pantry. +Question: Where does Sophia think Avery thinks Amelia thinks Chloe thinks the carrot is? +Answer: red_bucket +Choices: A. blue_pantry, B. red_box, C. red_envelope, D. green_envelope, E. green_drawer, F. blue_treasure_chest, G. blue_container, H. green_bucket, I. green_basket, J. red_drawer, K. red_pantry, L. green_treasure_chest, M. red_bucket, N. green_box, O. blue_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_bucket +GPT-4 Explain: K. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e46ccf27a46386b2fa8d8c7388d317242a5f7e9 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. 
+31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where is the watermelon really? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8dfa2ae136fa6c98657aaa5ea2a7e4156c97128 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. 
+Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Isla really think the watermelon is? +Answer: blue_cupboard +Choices: A. 
blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_cupboard +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..604e7b3bb82327b2400375a21313dabbd205c081 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. 
+11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Carter think Isla thinks the watermelon is? +Answer: blue_container +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. 
(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_container +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4442a6de74f5144a6548a941582aa88b485c3f16 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. 
+18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. +26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Elizabeth think Carter thinks Isla thinks the watermelon is? +Answer: red_envelope +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. 
(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: red_envelope +GPT-4 Explain: I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3bef6e086cff4363bea21adcad6adc9f09404439 --- /dev/null +++ b/ToMh_dataset/check_GPT-3.5-turbo/Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1,48 @@ +Read the following story and answer the multiple-choice question. Think step-by-step. Provide the answer first, and then explain it. +Story: +1 Nathan, Elizabeth, Carter, Jacob and Isla entered the kitchen. +2 The watermelon is in the blue_bottle. +3 Nathan made no movements and stayed in the kitchen for 1 minute. +4 Nathan exited the kitchen. +5 Elizabeth moved the watermelon to the red_envelope. +6 Elizabeth exited the kitchen. +7 Carter moved the watermelon to the blue_cupboard. +8 Carter exited the kitchen. +9 Jacob made no movements and stayed in the kitchen for 1 minute. +10 Jacob exited the kitchen. +11 Isla made no movements and stayed in the kitchen for 1 minute. +12 Carter dislikes the cherry. +13 Isla exited the kitchen. +14 Nathan, Elizabeth, Carter, Jacob and Isla entered the waiting_room. +15 Carter publicly claimed that watermelon is in the red_envelope. +16 Isla privately told Carter that the watermelon is in the blue_container. +17 Jacob, Carter and Elizabeth entered the kitchen. +18 The watermelon is in the blue_cupboard. +19 Jacob moved the watermelon to the red_envelope. +20 Jacob exited the kitchen. +21 Carter moved the watermelon to the green_bucket. +22 Carter exited the kitchen. +23 Elizabeth moved the watermelon to the blue_container. +24 Elizabeth exited the kitchen. +25 Jacob, Carter and Elizabeth entered the waiting_room. 
+26 Jacob, Isla, Elizabeth and Carter entered the porch. +27 The banana is in the red_drawer. +28 Jacob moved the banana to the blue_treasure_chest. +29 Isla likes the blue_bottle. +30 Jacob exited the porch. +31 Isla moved the banana to the green_treasure_chest. +32 Isla exited the porch. +33 Elizabeth moved the banana to the green_bathtub. +34 Elizabeth exited the porch. +35 Carter moved the banana to the blue_bucket. +36 Carter exited the porch. +37 Jacob, Isla, Elizabeth and Carter entered the waiting_room. +38 Isla privately told Elizabeth that the banana is in the red_drawer. +39 Carter privately told Nathan that the banana is in the blue_bucket. +Question: Where does Nathan think Elizabeth thinks Carter thinks Isla thinks the watermelon is? +Answer: blue_bottle +Choices: A. blue_bucket, B. red_drawer, C. green_bathtub, D. green_treasure_chest, E. blue_treasure_chest, F. blue_bottle, G. green_bucket, H. blue_cupboard, I. blue_container, J. red_envelope, K. blue_drawer, L. green_pantry, M. red_basket, N. red_crate, O. green_crate + +Note: You should assume the following. (1) An agent witnesses everything and every movements before exiting a location. (2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. (3) Note that every agent tend to lie. What a character tells others doesn't affect his actual belief. An agent tend to trust a agent that exited the room later than himself. The exit order is known to all agents. (4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims. +Correct answer: blue_bottle +GPT-4 Explain: I. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/clause.py b/ToMh_dataset/clause.py new file mode 100644 index 0000000000000000000000000000000000000000..e8f5e2a8839e85f45a863464ab685726ef6ed28e --- /dev/null +++ b/ToMh_dataset/clause.py @@ -0,0 +1,26 @@ +import numpy as np + + +class Clause(object): + + def __init__(self, action): + + # if observers is not None: + # assert 0 not in observers, "Observer IDs must be 1-indexed" + # self.observers = observers + self.action = action + + def render(self): + return self.action.render_declarative() # + \ + # ('\t' + ' '.join([str(x) for x in self.observers]) + # if self.observers is not None else '') + + +class Question(Clause): + + def __init__(self, idx_support, action): + self.idx_support = idx_support + super().__init__(action) + + def render(self): + return self.action.render_interrogative() diff --git a/ToMh_dataset/create_world.py b/ToMh_dataset/create_world.py new file mode 100644 index 0000000000000000000000000000000000000000..c19243de7666afbb4f0454e468628eb139cbf01a --- /dev/null +++ b/ToMh_dataset/create_world.py @@ -0,0 +1,248 @@ +import numpy as np + +SIZE_TINY = 5 +SIZE_SMALL = 10 +SIZE_LARGE = 30 +SIZE_XLARGE = 50 + +locations = [ + "attic", + "back_yard", + "basement", + "bathroom", + "bedroom", + "cellar", + "closet", + "crawlspace", + "den", + "dining_room", + "front_yard", + "garage", + "garden", + "hall", + "hallway", + "kitchen", + "laundry", + "living_room", + "lounge", + "master_bedroom", + "office", + "pantry", + "patio", + "playroom", + "porch", + "staircase", + "study", + "sunroom", + "TV_room", + "workshop", +] + +clothing = [ + "belt", + "boots", + "cap", + "coat", + "dress", + "gloves", + "hat", + "jacket", + "jeans", + "pajamas", + "pants", + "raincoat", + "scarf", + "shirt", + "shoes", + "skirt", + "slacks", + "slippers", + "socks", + "stockings", + "suit", + "sweater", + "sweatshirt", + "t-shirt", + "tie", + "trousers", + "underclothes", + "underpants", + "undershirt", +] 
+ +fruit = [ + "apple", + "banana", + "cherry", + "grapefruit", + "grapes", + "lemon", + "lime", + "melon", + "orange", + "peach", + "pear", + "persimmon", + "pineapple", + "plum", + "strawberry", + "tangerine", + "watermelon", +] + +vegetables = [ + "asparagus", + "beans", + "broccoli", + "cabbage", + "carrot", + "celery", + "corn", + "cucumber", + "eggplant", + "green_pepper", + "lettuce", + "onion", + "peas", + "potato", + "pumpkin", + "radish", + "spinach", + "sweet_potato", + "tomato", + "turnip", +] + +objects = fruit + vegetables + +containers = [ + "box", + "pantry", + "bathtub", + "envelope", + "drawer", + "bottle", + "cupboard", + "basket", + "crate", + "suitcase", + "bucket", + "container", + "treasure_chest", +] + +colors = ['green', 'blue', 'red'] + +containers = ['_'.join([color, container]) + for container in containers + for color in colors] + +names = [ + "Oliver", + "Ethan", + "Liam", + "Benjamin", + "Lucas", + "Alexander", + "Jacob", + "Mason", + "William", + "Gracie", + "James", + "Logan", + "Owen", + "Noah", + "Carter", + "Nathan", + "Jack", + "Aiden", + "Jackson", + "Jayden", + "Emma", + "Olivia", + "Emily", + "Sophia", + "Ava", + "Chloe", + "Charlotte", + "Abigail", + "Amelia", + "Ella", + "Hannah", + "Isabella", + "Aria", + "Lily", + "Mia", + "Isla", + "Avery", + "Elizabeth", + "Mila", + "Evelyn", +] + +assert len(locations) >= SIZE_LARGE +assert len(objects) >= SIZE_LARGE +assert len(containers) >= SIZE_LARGE +assert len(names) >= SIZE_LARGE + + +def write_world(filepath, locs, objs, conts, nams): + + with open(filepath, 'w') as f: + + f.write('# locations\n') + + for loc in locs: + + f.write('\n') + f.write('create %s\n' % loc) + f.write('set %s is_thing\n' % loc) + f.write('set %s is_location\n' % loc) + + f.write('\n') + f.write('# objects\n') + + for obj in objs: + + f.write('\n') + f.write('create %s\n' % obj) + f.write('set %s is_thing\n' % obj) + f.write('set %s is_gettable\n' % obj) + + f.write('\n') + f.write('# containers\n') + + 
for cont in conts: + + f.write('\n') + f.write('create %s\n' % cont) + f.write('set %s is_thing\n' % cont) + f.write('set %s is_container\n' % cont) + + f.write('\n') + f.write('# actors\n') + + for nam in nams: + + f.write('\n') + f.write('create %s\n' % nam) + f.write('set %s is_actor\n' % nam) + f.write('set %s is_god\n' % nam) + +write_world('world_tiny.txt', + np.random.choice(locations, SIZE_TINY, replace=False), + np.random.choice(objects, SIZE_TINY, replace=False), + np.random.choice(containers, SIZE_TINY, replace=False), + np.random.choice(names, SIZE_TINY, replace=False)) + +write_world('world_small.txt', + np.random.choice(locations, SIZE_SMALL, replace=False), + np.random.choice(objects, SIZE_SMALL, replace=False), + np.random.choice(containers, SIZE_SMALL, replace=False), + np.random.choice(names, SIZE_SMALL, replace=False)) + +write_world('world_large.txt', + np.random.choice(locations, SIZE_LARGE, replace=False), + np.random.choice(objects, SIZE_LARGE, replace=False), + np.random.choice(containers, SIZE_LARGE, replace=False), + np.random.choice(names, SIZE_LARGE, replace=False)) diff --git a/ToMh_dataset/data_figs/CoT_heatmaps.pdf b/ToMh_dataset/data_figs/CoT_heatmaps.pdf new file mode 100644 index 0000000000000000000000000000000000000000..dc298aa73d9fdc67059c9f7d76e83d898fa3b433 Binary files /dev/null and b/ToMh_dataset/data_figs/CoT_heatmaps.pdf differ diff --git a/ToMh_dataset/data_figs/CoT_heatmaps_GPT3.5.pdf b/ToMh_dataset/data_figs/CoT_heatmaps_GPT3.5.pdf new file mode 100644 index 0000000000000000000000000000000000000000..b5d8bad364bdd9ea3a83e34c752d017fc198ed6e Binary files /dev/null and b/ToMh_dataset/data_figs/CoT_heatmaps_GPT3.5.pdf differ diff --git a/ToMh_dataset/data_figs/CoT_heatmaps_LLaMA.pdf b/ToMh_dataset/data_figs/CoT_heatmaps_LLaMA.pdf new file mode 100644 index 0000000000000000000000000000000000000000..143de2d6476223788b9d378737307bb6277eaf1b Binary files /dev/null and b/ToMh_dataset/data_figs/CoT_heatmaps_LLaMA.pdf differ diff 
--git a/ToMh_dataset/dynamic_actions.py b/ToMh_dataset/dynamic_actions.py new file mode 100644 index 0000000000000000000000000000000000000000..bfeb5a7f8d080686d55fd05ce95aeb9b7b244a12 --- /dev/null +++ b/ToMh_dataset/dynamic_actions.py @@ -0,0 +1,369 @@ +import numpy as np +import random +from itertools import combinations +from itertools import permutations + + +class Action(object): + + def __init__(self, templates): + self.templates = templates + + def render_declarative(self): + assert 'declarative' in self.templates and \ + len(self.templates['declarative']) > 0 + return np.random.choice(self.templates['declarative']) + + def render_interrogative(self): + assert 'interrogative' in self.templates and \ + len(self.templates['interrogative']) > 0, str(self.templates) + return np.random.choice(self.templates['interrogative']) + + +class ExitAction(Action): + + def __init__(self): + templates = { + 'declarative': [ + '%s exited the %s.', + '%s left the %s.', + '%s went out of the %s.', + ], + } + super().__init__(templates) + +######################################### +############### Questions ############### +######################################### + + +class ZeroQ(Action): + + def __init__(self, oracle, obj): + + fill = (obj, oracle.get_object_container(obj)) + templates = { + 'interrogative': [ + 'Question: Where is the %s really?\nAnswer: %s' % fill, + ] + } + super().__init__(templates) + + +class FirstQ(Action): + + def __init__(self, oracle, agent, obj): + fill = (agent, obj, oracle.get_first_belief(agent, obj)) + templates = { + 'interrogative': [ + 'Question: Where does %s really think the %s is?\nAnswer: %s' % fill, + ] + } + super().__init__(templates) + + +class SecondQ(Action): + + def __init__(self, oracle, a1, a2, obj): + fill = (a1, a2, obj, oracle.get_second_belief(a1, a2, obj)) + templates = { + 'interrogative': [ + 'Question: Where does %s think %s thinks the %s is?\nAnswer: %s' % fill, + ] + } + super().__init__(templates) + + +class 
ThirdQ(Action): + + def __init__(self, oracle, a1, a2, a3, obj): + fill = (a1, a2, a3, obj, oracle.get_third_belief(a1, a2, a3, obj)) + templates = { + 'interrogative': [ + 'Question: Where does %s think %s thinks %s thinks the %s is?\nAnswer: %s' % fill, + ] + } + super().__init__(templates) + + +class FourthQ(Action): + + def __init__(self, oracle, a1, a2, a3, a4, obj): + fill = (a1, a2, a3, a4, obj, + oracle.get_fourth_belief(a1, a2, a3, a4, obj)) + templates = { + 'interrogative': [ + 'Question: Where does %s think %s thinks %s thinks %s thinks the %s is?\nAnswer: %s' % fill, + ] + } + super().__init__(templates) + +# class MemoryAction(Action): + +# def __init__(self, oracle_start_state, obj): +# fill = (obj, oracle_start_state[obj]) +# templates = { +# 'interrogative': [ +# 'Where was the %s at the beginning?\t%s' % fill, +# ] +# } +# super().__init__(templates) + +# class LocationAction(Action): +# def __init__(self, oracle, args): +# """ +# Creaters string with args and modifies +# oracle in accordance with action. +# """ +# if len(args) == 2: +# statement = '%s is in the %s.' % args +# a1, loc = args +# # may be redundant +# oracle.set_location(a1, loc) +# else : # 2 people +# statement = '%s and %s are in the %s.' % args +# a1, a2, loc = args +# # may be redundant +# oracle.set_location(a1, loc) +# oracle.set_location(a2, loc) + +# templates = { +# 'declarative': [ +# statement, +# ] +# } + +# super().__init__(templates) + + +class ObjectLocAction(Action): + + def __init__(self, oracle, obj, observers): + container = oracle.get_object_container(obj) + templates = { + 'declarative': [ + 'The %s is in the %s.' 
% (obj, container), + ] + } + + # set first beliefs + for observer in observers: + oracle.set_first_belief(observer, obj, container) + + # set second beliefs + if len(observers) >= 2: + for observer1, observer2 in combinations(observers, 2): + oracle.set_second_belief(observer1, observer2, obj, container) + oracle.set_second_belief(observer2, observer1, obj, container) + + # set third beliefs + if len(observers) >= 3: + for chosen_observers in combinations(observers, 3): + for observer1, observer2, observer3 in permutations(chosen_observers): + oracle.set_third_belief( + observer1, observer2, observer3, obj, container) + + # set fourth beliefs + if len(observers) >= 4: + for chosen_observers in combinations(observers, 4): + for observer1, observer2, observer3, observer4 in permutations(chosen_observers): + oracle.set_fourth_belief( + observer1, observer2, observer3, observer4, obj, container) + super().__init__(templates) + + +class ExitedAction(Action): + + def __init__(self, oracle, agent): + fill = (agent, oracle.get_location(agent)) + + templates = { + 'declarative': [ + '%s exited the %s.' % fill, + ] + } + oracle.set_location(agent, None) + super().__init__(templates) + + +class MoveAction(Action): + + def __init__(self, oracle, args, observers=None, move=True): + agent, obj, container = args + if not move: + location = oracle.get_container_location(container) + templates = { + 'declarative': [ + f'{args[0]} made no movements and stayed in the {location} for 1 minute.', + ] + } + + else: + templates = { + 'declarative': [ + '%s moved the %s to the %s.' 
% args, + ] + } + + oracle.set_object_container(obj, container) + + if not observers: + observers = [] + observers.append(agent) + + # set first beliefs + for observer in observers: + oracle.set_first_belief(observer, obj, container) + + # set second beliefs + if len(observers) >= 2: + for observer1, observer2 in combinations(observers, 2): + oracle.set_second_belief( + observer1, observer2, obj, container) + oracle.set_second_belief( + observer2, observer1, obj, container) + + # set third beliefs + if len(observers) >= 3: + for chosen_observers in combinations(observers, 3): + for observer1, observer2, observer3 in permutations(chosen_observers): + oracle.set_third_belief( + observer1, observer2, observer3, obj, container) + + # set fourth beliefs + if len(observers) >= 4: + for chosen_observers in combinations(observers, 4): + for observer1, observer2, observer3, observer4 in permutations(chosen_observers): + oracle.set_fourth_belief( + observer1, observer2, observer3, observer4, obj, container) + + super().__init__(templates) + + +class PublicTellAction(Action): + + def __init__(self, oracle, speaker, obj, container, listeners=None, believers=None): + templates = { + 'declarative': [ + '%s publicly claimed that %s is in the %s now.' 
% ( + speaker, obj, container), + ] + } + disbelievers = [ + listener for listener in listeners if listener not in believers] + + # All listeners would think others believe the claim + # for believer in believers: + # for disbeliever in disbelievers: + # oracle.set_second_belief(believer, disbeliever, obj, container) + # oracle.set_second_belief(disbeliever, believer, obj, container) + + # A believer would think speaker also believes the obj is in container, speaker would think his words are trusted + for believer in believers: + oracle.set_first_belief(believer, obj, container) + oracle.set_second_belief(believer, speaker, obj, container) + oracle.set_second_belief(speaker, believer, obj, container) + + for disbeliever in disbelievers: + oracle.set_second_belief(speaker, disbeliever, obj, container) + + # for listener in listeners: + # # the speaker believes that all the listeners believe him + # oracle.set_second_belief(speaker, listener, obj, container) + # # all listeners know the believers based on the exiting order + # for believer in believers: + # oracle.set_second_belief(listener, believer, obj, container) + + super().__init__(templates) + + +class PrivateTellAction(Action): + + def __init__(self, oracle, speaker, listener, obj, container, trust=True): + templates = { + 'declarative': [ + '%s privately told %s that the %s is in the %s now.' 
% ( + speaker, listener, obj, container), + ] + } + + # when the listener has less information (exit the room earlier), he'll trust the speaker + if trust: + oracle.set_first_belief(listener, obj, container) + oracle.set_second_belief(listener, speaker, obj, container) + oracle.set_second_belief(speaker, listener, obj, container) + super().__init__(templates) + + +class EnterAction(Action): + + def __init__(self, oracle, args, observers=None, no_world_adjust=False): + templates = { + 'declarative': [ + ', '.join(args[:-2]) + ' and ' + args[-2] + + ' entered the ' + args[-1] + '.', + ] + } + + agents = args[:-1] + location = args[-1] + if location == 'waiting_room': + super().__init__(templates) + return + for agent in agents: + oracle.set_location(agent, location) + objs = oracle.get_objects_at_location(location) + observers = agents + + # agent knows location of everything + if not no_world_adjust: + for obj in objs: + container = oracle.get_object_container(obj) + # oracle.set_first_belief(agent, obj, container) + # set first beliefs + if len(observers) >= 1: + for observer in observers: + oracle.set_first_belief(observer, obj, container) + + # set second beliefs + if len(observers) >= 2: + for observer1, observer2 in combinations(observers, 2): + oracle.set_second_belief( + observer1, observer2, obj, container) + oracle.set_second_belief( + observer2, observer1, obj, container) + + # set third beliefs + if len(observers) >= 3: + for chosen_observers in combinations(observers, 3): + for observer1, observer2, observer3 in permutations(chosen_observers): + oracle.set_third_belief( + observer1, observer2, observer3, obj, container) + + # set fourth beliefs + if len(observers) >= 4: + for chosen_observers in combinations(observers, 4): + for observer1, observer2, observer3, observer4 in permutations(chosen_observers): + oracle.set_fourth_belief( + observer1, observer2, observer3, observer4, obj, container) + + super().__init__(templates) + + +class 
NoiseAction(Action): + + def __init__(self, agents, containers, objects): + animals = ['cat', 'dog', 'monkey', 'mouse'] + personal_items = ['watch', 'gloves', 'phone'] + distractors = [ + f'{random.choice(agents)} saw a {random.choice(animals)}.', + f'{random.choice(agents)} lost his {random.choice(personal_items)}.', + f'{random.choice(agents)} likes the {random.choice(containers)}.', + f'{random.choice(agents)} dislikes the {random.choice(objects)}.', + ] + templates = { + 'declarative': [ + random.choice(distractors) + ] + } + super().__init__(templates) diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..71bd126bff050ead46a380ac3356ebb8749d923e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1 @@ +K. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1 @@ +L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..69202a077a3d75358e84ea94cb321f8f591ce9cc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1 @@ +G. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..69202a077a3d75358e84ea94cb321f8f591ce9cc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1 @@ +G. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..033b6976cccdb391c300eed6649e0a418c776eb9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1 @@ +I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..033b6976cccdb391c300eed6649e0a418c776eb9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1 @@ +I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..033b6976cccdb391c300eed6649e0a418c776eb9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1 @@ +I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe4074b23906794c3174aafcbf47bd1fbe2a1f8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1 @@ +F. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe4074b23906794c3174aafcbf47bd1fbe2a1f8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1 @@ +F. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a55b502972694df70071342dfdd391882f526537 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1 @@ +H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a55b502972694df70071342dfdd391882f526537 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1 @@ +H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a55b502972694df70071342dfdd391882f526537 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1 @@ +H. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..28da04de2eecc0b3436d3a52ef4ad43f8852e144 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1 @@ +I. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cedfb2c0910a9ff50a6fc3937253b6bd8b63a5d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1 @@ +G. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..76dda8de05110b13966ae5e6f3900d500f6d05eb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1 @@ +F. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cedfb2c0910a9ff50a6fc3937253b6bd8b63a5d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1 @@ +G. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cedfb2c0910a9ff50a6fc3937253b6bd8b63a5d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1 @@ +G. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f64e5a7ed4fd9e274e574ef68056e991f821ad3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1 @@ +H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f64e5a7ed4fd9e274e574ef68056e991f821ad3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1 @@ +H. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f64e5a7ed4fd9e274e574ef68056e991f821ad3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1 @@ +H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f64e5a7ed4fd9e274e574ef68056e991f821ad3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1 @@ +H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e97b1e5a07d640a6b0bc360874f848a16dfd4611 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1 @@ +K. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e97b1e5a07d640a6b0bc360874f848a16dfd4611 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1 @@ +K. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e97b1e5a07d640a6b0bc360874f848a16dfd4611 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1 @@ +K. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a56ff875efd313cf02ac289f14cb0377e559a167 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1 @@ +M. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a56ff875efd313cf02ac289f14cb0377e559a167 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1 @@ +M. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5e1522f1f128da267c4275d7f9b327466dbbe30 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1 @@ +C. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5e1522f1f128da267c4275d7f9b327466dbbe30 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1 @@ +C. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1 @@ +F. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..beafdfe4e6806eeee4e2c87ec3c2b9d23429c83d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1 @@ +B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1 @@ +A. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1 @@ +A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1 @@ +A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1 @@ +A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1 @@ +L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..02421bddf2802240d7fd16cb53ac1ff5fc2937db --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1 @@ +E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1 @@ +D. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1 @@ +D. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1 @@ +D. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1 @@ +D. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1 @@ +D. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1 @@ +F. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f72e029dd84aff08de2ce74e9782de0899339ec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1 @@ +J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d8d99d95007f50227c2e98803276c5aae0f2738 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1 @@ +H. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d8d99d95007f50227c2e98803276c5aae0f2738 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1 @@ +H. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1 @@ +K. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1 @@ +K. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1 @@ +L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f05b7a8828e46a1827483cb5c051b455ca169c7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1 @@ +O. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f05b7a8828e46a1827483cb5c051b455ca169c7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1 @@ +O. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..74bd86004159ceff1e4c64cd19f69ae28ab401df --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1 @@ +M. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1 @@ +H. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1 @@ +H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1 @@ +H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1 @@ +H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1 @@ +J. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1 @@ +J. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ec660f1d4f0c63a63acfa38b8b7142b314802ec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1 @@ +G. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1 @@ +F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1 @@ +F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1 @@ +F. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1 @@ +F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a2928633a2c7004301f9fd2a2e46809a88675e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1 @@ +G. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac18936ec1027159fe470e42fbd631e4ecb97ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1 @@ +F. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd5cfea4e0e325df9ace67f548534c5b815185c5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1 @@ +I. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac18936ec1027159fe470e42fbd631e4ecb97ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1 @@ +F. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bd5cfea4e0e325df9ace67f548534c5b815185c5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1 @@ +I. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1 @@ +A. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ccbbff2467c29135cb108bd90e4fb567ec4f3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1 @@ +C. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..78e73a8947e4fad4f25d4b47ff2492c457d8ef2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1 @@ +B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1 @@ +H. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1 @@ +H. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1 @@ +H. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1 @@ +H. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1 @@ +H. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1 @@ +M. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..76ca4522ec267ad87de9f51ad1c957af47812051 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1 @@ +D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1 @@ +A. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..76ca4522ec267ad87de9f51ad1c957af47812051 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1 @@ +D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..39595ced9c5dbcc8ddeab8a077bd5e13e94cd355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1 @@ +O. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..39595ced9c5dbcc8ddeab8a077bd5e13e94cd355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1 @@ +O. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a86bd1acc5b64df55dbe0b368aeb49a8f6eb1767 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1 @@ +L. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..39595ced9c5dbcc8ddeab8a077bd5e13e94cd355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1 @@ +O. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1109540b5af320bca7cf76ca77ac6b758f159806 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1 @@ +E. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1109540b5af320bca7cf76ca77ac6b758f159806 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1 @@ +E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1109540b5af320bca7cf76ca77ac6b758f159806 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1 @@ +E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1 @@ +A. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1 @@ +L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d5308076fcca91f62db013641bb581eeef4e55e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1 @@ +B. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1 @@ +C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1 @@ +C. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1 @@ +C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1 @@ +C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecab00230c26a12ad6d0795e9a20a5fef5adc790 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1 @@ +M. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecab00230c26a12ad6d0795e9a20a5fef5adc790 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1 @@ +M. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..236feb19b83d8d364a1351faec334d348492c2bc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1 @@ +K. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..236feb19b83d8d364a1351faec334d348492c2bc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1 @@ +K. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..236feb19b83d8d364a1351faec334d348492c2bc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1 @@ +K. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1 @@ +K. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f7ffb8f54e8b5bdc2133a560152dca8de2f273 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1 @@ +C. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f7ffb8f54e8b5bdc2133a560152dca8de2f273 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1 @@ +C. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f7ffb8f54e8b5bdc2133a560152dca8de2f273 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1 @@ +C. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1 @@ +A. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0ea1a9cf7c09f578a3397d950ef255073bec7de --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1 @@ +C. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1 @@ +M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1 @@ +M. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cea0ef33c2fc9d542c68187afdc1af7f6da3b292 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1 @@ +O. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cea0ef33c2fc9d542c68187afdc1af7f6da3b292 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1 @@ +O. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cea0ef33c2fc9d542c68187afdc1af7f6da3b292 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1 @@ +O. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cbe6c12444ee3a56c4e374859f0ab4960805fed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1 @@ +B. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cbe6c12444ee3a56c4e374859f0ab4960805fed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1 @@ +B. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..337a8cf50d091b6b5ecdc3dc2ec918ab34347c3c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1 @@ +D. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..337a8cf50d091b6b5ecdc3dc2ec918ab34347c3c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1 @@ +D. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..337a8cf50d091b6b5ecdc3dc2ec918ab34347c3c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1 @@ +D. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9574b0a41522c19a313f28691f9380d3619ac68d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1 @@ +C. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1 @@ +B. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a154c43202526d29615c1cba44867122477a0ac5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1 @@ +F. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b922c84801117f9f9b34ab1a24ac1c3401811dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1 @@ +G. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b922c84801117f9f9b34ab1a24ac1c3401811dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1 @@ +G. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a154c43202526d29615c1cba44867122477a0ac5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1 @@ +F. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba00fc0cc6bcc2312fbec141c81fad0d2fe9ffb5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1 @@ +J. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1 @@ +N. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1 @@ +E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c32f659858ad34579205ef6266e84f272e26d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1 @@ +A. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c32f659858ad34579205ef6266e84f272e26d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1 @@ +A. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c32f659858ad34579205ef6266e84f272e26d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1 @@ +A. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1 @@ +E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1 @@ +A. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1 @@ +K. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5f2e55eda95f15335f5cd63d7eb75fd8414c797 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1 @@ +F. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8233adbc15dffd0f3c2ea80d25e54f153feb51e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1 @@ +G. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8233adbc15dffd0f3c2ea80d25e54f153feb51e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1 @@ +G. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5f2e55eda95f15335f5cd63d7eb75fd8414c797 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1 @@ +F. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5f2e55eda95f15335f5cd63d7eb75fd8414c797 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1 @@ +F. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1 @@ +A. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1 @@ +A. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..50660968897f358802b8ad8147be24df49ba96df --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1 @@ +E. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1 @@ +A. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d67bde6abfea7041945c1d7af6bccc131b17bbc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1 @@ +N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1 @@ +M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1 @@ +M. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1 @@ +M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1 @@ +M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c72d16f4049489d6a5986ee95c283482b65e8a29 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1 @@ +M. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1 @@ +O. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df7fd34eeab9a6c1cb128bc1141572c2ef5b95c2 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1 @@ +B. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1 @@ +C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1 @@ +F. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1 @@ +F. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1 @@ +F. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f72e029dd84aff08de2ce74e9782de0899339ec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1 @@ +J. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f72e029dd84aff08de2ce74e9782de0899339ec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1 @@ +J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec714eecffd9c487f25cea09ca08d85719a5f96e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1 @@ +G. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c1fbfc862f27a0d89c7e7c85e49f9ce39eadd2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1 @@ +H. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec714eecffd9c487f25cea09ca08d85719a5f96e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1 @@ +G. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c1fbfc862f27a0d89c7e7c85e49f9ce39eadd2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1 @@ +H. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c1fbfc862f27a0d89c7e7c85e49f9ce39eadd2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1 @@ +H. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a02dad6139cd25a61da6e0e39d78531691c76ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1 @@ +M. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b4e1b63089fcad515d8a61751eabedc00193569 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1 @@ +K. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b4e1b63089fcad515d8a61751eabedc00193569 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1 @@ +K. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a68ebfde4b67da1720f3fe97108dd4b2d5c4a40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1 @@ +O. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1 @@ +N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1 @@ +N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1 @@ +N. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1 @@ +N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f72bef47dbc2768994153539d80421aef99397ba --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1 @@ +O. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a54ab342df6381550d14fb7f136581e3235fea5a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1 @@ +N. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7973f8fdcade2def238f70b25c564e76699783b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1 @@ +L. 
green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7973f8fdcade2def238f70b25c564e76699783b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1 @@ +L. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f72bef47dbc2768994153539d80421aef99397ba --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1 @@ +O. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1 @@ +E. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1 @@ +G. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1 @@ +G. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1 @@ +O. 
blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1 @@ +C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1 @@ +C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1 @@ +C. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..766939aaaf9d2f33a29eb103d53d884640f16d6b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1 @@ +M. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1 @@ +L. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1 @@ +L. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1 @@ +L. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1 @@ +L. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7973f8fdcade2def238f70b25c564e76699783b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1 @@ +L. 
green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7973f8fdcade2def238f70b25c564e76699783b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1 @@ +L. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1 @@ +M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1 @@ +O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1 @@ +M. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..043750ba8be3608c7df5257f16bc06e3142595b0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1 @@ +J. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..71bd126bff050ead46a380ac3356ebb8749d923e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1 @@ +K. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb719ce6dd764837fea876a8d742c88f0c819912 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1 @@ +O. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1 @@ +L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..69202a077a3d75358e84ea94cb321f8f591ce9cc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1 @@ +G. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..69202a077a3d75358e84ea94cb321f8f591ce9cc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1 @@ +G. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..69202a077a3d75358e84ea94cb321f8f591ce9cc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1 @@ +G. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..033b6976cccdb391c300eed6649e0a418c776eb9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1 @@ +I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..033b6976cccdb391c300eed6649e0a418c776eb9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1 @@ +I. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe4074b23906794c3174aafcbf47bd1fbe2a1f8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1 @@ +F. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe4074b23906794c3174aafcbf47bd1fbe2a1f8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1 @@ +F. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a55b502972694df70071342dfdd391882f526537 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1 @@ +H. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe4074b23906794c3174aafcbf47bd1fbe2a1f8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1 @@ +F. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fe4074b23906794c3174aafcbf47bd1fbe2a1f8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1 @@ +F. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..28da04de2eecc0b3436d3a52ef4ad43f8852e144 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1 @@ +I. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cedfb2c0910a9ff50a6fc3937253b6bd8b63a5d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1 @@ +G. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cedfb2c0910a9ff50a6fc3937253b6bd8b63a5d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1 @@ +G. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cedfb2c0910a9ff50a6fc3937253b6bd8b63a5d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1 @@ +G. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..76dda8de05110b13966ae5e6f3900d500f6d05eb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1 @@ +F. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f64e5a7ed4fd9e274e574ef68056e991f821ad3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1 @@ +H. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f64e5a7ed4fd9e274e574ef68056e991f821ad3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1 @@ +H. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1 @@ +I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1 @@ +I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e97b1e5a07d640a6b0bc360874f848a16dfd4611 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1 @@ +K. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e97b1e5a07d640a6b0bc360874f848a16dfd4611 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1 @@ +K. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e97b1e5a07d640a6b0bc360874f848a16dfd4611 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1 @@ +K. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a56ff875efd313cf02ac289f14cb0377e559a167 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1 @@ +M. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a56ff875efd313cf02ac289f14cb0377e559a167 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1 @@ +M. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..02421bddf2802240d7fd16cb53ac1ff5fc2937db --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1 @@ +E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1 @@ +B. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..02421bddf2802240d7fd16cb53ac1ff5fc2937db --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1 @@ +E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1 @@ +F. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..beafdfe4e6806eeee4e2c87ec3c2b9d23429c83d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1 @@ +B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1 @@ +A. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1 @@ +A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1 @@ +A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cf918913473058cd52b94293be01c5c94e03324 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1 @@ +A. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1 @@ +L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..02421bddf2802240d7fd16cb53ac1ff5fc2937db --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1 @@ +E. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1 @@ +D. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1 @@ +D. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1 @@ +D. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..259f2e13d3186d37f145399f7eadc25006f92750 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1 @@ +D. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1 @@ +D. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1 @@ +F. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d8d99d95007f50227c2e98803276c5aae0f2738 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1 @@ +H. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1 @@ +K. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1 @@ +K. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1 @@ +L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f05b7a8828e46a1827483cb5c051b455ca169c7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1 @@ +O. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f05b7a8828e46a1827483cb5c051b455ca169c7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1 @@ +O. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f05b7a8828e46a1827483cb5c051b455ca169c7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1 @@ +O. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1 @@ +F. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1 @@ +H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1 @@ +H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2b5e523a34a6bf76d19098a45517cfcd09c9072 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1 @@ +H. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1 @@ +J. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1 @@ +J. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ec660f1d4f0c63a63acfa38b8b7142b314802ec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1 @@ +G. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1 @@ +F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1 @@ +F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1 @@ +F. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..384f35990d0dc48c9b3ec0e7a5424e4e7801fd05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1 @@ +F. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a2928633a2c7004301f9fd2a2e46809a88675e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1 @@ +G. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac18936ec1027159fe470e42fbd631e4ecb97ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1 @@ +F. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac18936ec1027159fe470e42fbd631e4ecb97ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1 @@ +F. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac18936ec1027159fe470e42fbd631e4ecb97ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1 @@ +F. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac18936ec1027159fe470e42fbd631e4ecb97ff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1 @@ +F. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1 @@ +A. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ccbbff2467c29135cb108bd90e4fb567ec4f3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1 @@ +C. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ccbbff2467c29135cb108bd90e4fb567ec4f3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1 @@ +C. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ccbbff2467c29135cb108bd90e4fb567ec4f3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1 @@ +C. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1 @@ +H. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1 @@ +H. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d33f08d7299a2d058c712576d8f0d70fa3e97b1a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1 @@ +G. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1 @@ +H. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4174098b8d6f56ad482d31fa503d882c0e2bca5c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1 @@ +H. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1 @@ +M. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c57e8010a81267d967e1058c773df241c65a274d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1 @@ +M. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a86bd1acc5b64df55dbe0b368aeb49a8f6eb1767 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1 @@ +L. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..76ca4522ec267ad87de9f51ad1c957af47812051 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1 @@ +D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..76ca4522ec267ad87de9f51ad1c957af47812051 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1 @@ +D. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1 @@ +A. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a86bd1acc5b64df55dbe0b368aeb49a8f6eb1767 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1 @@ +L. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..39595ced9c5dbcc8ddeab8a077bd5e13e94cd355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1 @@ +O. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a86bd1acc5b64df55dbe0b368aeb49a8f6eb1767 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1 @@ +L. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..39595ced9c5dbcc8ddeab8a077bd5e13e94cd355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1 @@ +O. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..1109540b5af320bca7cf76ca77ac6b758f159806 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1 @@ +E. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1109540b5af320bca7cf76ca77ac6b758f159806 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1 @@ +E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1109540b5af320bca7cf76ca77ac6b758f159806 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1 @@ +E. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1 @@ +A. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1 @@ +L. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4623ca0e93f4df08bfa82fa34ac417b38161c4c4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1 @@ +L. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7d5308076fcca91f62db013641bb581eeef4e55e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1 @@ +B. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1 @@ +C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1 @@ +C. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1 @@ +C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1ac4ca41921340ec973330ee2c38b3c3d723a05 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1 @@ +C. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecab00230c26a12ad6d0795e9a20a5fef5adc790 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1 @@ +M. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..236feb19b83d8d364a1351faec334d348492c2bc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1 @@ +K. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..236feb19b83d8d364a1351faec334d348492c2bc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1 @@ +K. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecab00230c26a12ad6d0795e9a20a5fef5adc790 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1 @@ +M. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..236feb19b83d8d364a1351faec334d348492c2bc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1 @@ +K. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1 @@ +K. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f7ffb8f54e8b5bdc2133a560152dca8de2f273 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1 @@ +C. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1 @@ +B. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f7ffb8f54e8b5bdc2133a560152dca8de2f273 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1 @@ +C. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1 @@ +A. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1 @@ +M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1 @@ +M. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1 @@ +M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1 @@ +M. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..95c51fcea27065b1b4798f243143607296fda12f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1 @@ +N. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6cbe6c12444ee3a56c4e374859f0ab4960805fed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1 @@ +B. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4335a90ed52448b1c74f7e44bf700126ef75d6dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1 @@ +C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4335a90ed52448b1c74f7e44bf700126ef75d6dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1 @@ +C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4335a90ed52448b1c74f7e44bf700126ef75d6dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1 @@ +C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4335a90ed52448b1c74f7e44bf700126ef75d6dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1 @@ +C. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9574b0a41522c19a313f28691f9380d3619ac68d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1 @@ +C. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1 @@ +B. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a154c43202526d29615c1cba44867122477a0ac5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1 @@ +F. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b922c84801117f9f9b34ab1a24ac1c3401811dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1 @@ +G. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b922c84801117f9f9b34ab1a24ac1c3401811dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1 @@ +G. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a154c43202526d29615c1cba44867122477a0ac5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1 @@ +F. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a154c43202526d29615c1cba44867122477a0ac5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1 @@ +F. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1 @@ +N. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c9280591fab665aea606c62faf687f35ec17014a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1 @@ +N. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1 @@ +E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c32f659858ad34579205ef6266e84f272e26d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1 @@ +A. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c32f659858ad34579205ef6266e84f272e26d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1 @@ +A. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c32f659858ad34579205ef6266e84f272e26d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1 @@ +A. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1 @@ +E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1 @@ +A. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1 @@ +K. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..caf80c652d7b2a9698d0489eb3064827fe945ef5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1 @@ +K. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8233adbc15dffd0f3c2ea80d25e54f153feb51e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1 @@ +G. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f8233adbc15dffd0f3c2ea80d25e54f153feb51e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1 @@ +G. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5f2e55eda95f15335f5cd63d7eb75fd8414c797 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1 @@ +F. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b5f2e55eda95f15335f5cd63d7eb75fd8414c797 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1 @@ +F. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1 @@ +A. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1 @@ +A. 
green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..50660968897f358802b8ad8147be24df49ba96df --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1 @@ +E. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1 @@ +A. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..93f07f129465202429a811982c4081a4d460eaef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1 @@ +A. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6d67bde6abfea7041945c1d7af6bccc131b17bbc --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1 @@ +N. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1 @@ +M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1 @@ +M. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1 @@ +M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..450eca0b704a8cb79defb994f00ce0109c00cf91 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1 @@ +M. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..c72d16f4049489d6a5986ee95c283482b65e8a29 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1 @@ +M. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1 @@ +O. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df7fd34eeab9a6c1cb128bc1141572c2ef5b95c2 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1 @@ +B. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1 @@ +C. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1 @@ +F. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1 @@ +F. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1 @@ +F. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4237cd980cd839273a83cb7b2b85921b37434186 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1 @@ +F. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..0f72e029dd84aff08de2ce74e9782de0899339ec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1 @@ +J. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec714eecffd9c487f25cea09ca08d85719a5f96e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1 @@ +G. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c1fbfc862f27a0d89c7e7c85e49f9ce39eadd2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1 @@ +H. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..0c1fbfc862f27a0d89c7e7c85e49f9ce39eadd2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1 @@ +H. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec714eecffd9c487f25cea09ca08d85719a5f96e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1 @@ +G. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec714eecffd9c487f25cea09ca08d85719a5f96e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1 @@ +G. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b4e1b63089fcad515d8a61751eabedc00193569 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1 @@ +K. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1 @@ +L. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1 @@ +N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1 @@ +N. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e0dbb6dee2a2098b51f920c05b4ac3cdd907b093 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1 @@ +N. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a68ebfde4b67da1720f3fe97108dd4b2d5c4a40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1 @@ +O. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f72bef47dbc2768994153539d80421aef99397ba --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1 @@ +O. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a54ab342df6381550d14fb7f136581e3235fea5a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1 @@ +N. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7973f8fdcade2def238f70b25c564e76699783b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1 @@ +L. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f72bef47dbc2768994153539d80421aef99397ba --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1 @@ +O. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1 @@ +E. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ff2b1f1400c4f731cfdb1119268da254010e80c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1 @@ +E. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..36b964b22b10d186edd98e4f9899caacf6725501 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1 @@ +C. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. 
\ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1 @@ +G. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1 @@ +O. 
blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6491783a4c60c11c9a1e52b16beffac9244e67d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1 @@ +O. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1 @@ +C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1 @@ +C. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1 @@ +C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6f64fa0d326b4861ef9b8283f17c9abee9db7035 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1 @@ +A. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..766939aaaf9d2f33a29eb103d53d884640f16d6b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1 @@ +M. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1 @@ +L. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1 @@ +L. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1 @@ +L. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..44d18ebe03fbb4a0d1648d7a5fcb957f5b90724f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1 @@ +L. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. 
\ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..1cea3cfae685e297d26ca60270ad12fdd82bd2e6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1 @@ +E. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1cea3cfae685e297d26ca60270ad12fdd82bd2e6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1 @@ +E. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..1cea3cfae685e297d26ca60270ad12fdd82bd2e6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1 @@ +E. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..84040518fdd8e6ffc996a017ae225126391adf40 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1 @@ +M. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..043750ba8be3608c7df5257f16bc06e3142595b0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1 @@ +J. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..50f7bcbf7ab38ec95ab86c7dd20b042b741c2817 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/No_Tell/MC/length_3/sample_9/order_4.txt @@ -0,0 +1 @@ +F. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_0.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_1.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_2.txt @@ -0,0 +1 @@ +A. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_3.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_1/order_4.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..47ddb6939398a9dfb3517850577fc6c19a139352 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_0.txt @@ -0,0 +1 @@ +B. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_1.txt @@ -0,0 +1 @@ +A. 
blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_2.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_3.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_10/order_4.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3bf7f8bd23f5e9776716245e0f154177f6fd1a7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_0.txt @@ -0,0 +1 @@ +H. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_1.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_2.txt @@ -0,0 +1 @@ +I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_3.txt @@ -0,0 +1 @@ +I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_11/order_4.txt @@ -0,0 +1 @@ +I. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9814f89dd18447778d14a465ad075b896ec5e7ed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_1.txt @@ -0,0 +1 @@ +O. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9814f89dd18447778d14a465ad075b896ec5e7ed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_2.txt @@ -0,0 +1 @@ +O. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..17acea5687120a02dee8b726eda6f4890394c0d8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_3.txt @@ -0,0 +1 @@ +K. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_12/order_4.txt @@ -0,0 +1 @@ +N. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_1.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_2.txt @@ -0,0 +1 @@ +A. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_3.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_13/order_4.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..75fe7cde90ed25447460e5682dd53a849019409a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_0.txt @@ -0,0 +1 @@ +K. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_1.txt @@ -0,0 +1 @@ +N. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_2.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_3.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_14/order_4.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. 
\ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_1.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_2.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_3.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_15/order_4.txt @@ -0,0 +1 @@ +K. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_1.txt @@ -0,0 +1 @@ +O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_2.txt @@ -0,0 +1 @@ +O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_3.txt @@ -0,0 +1 @@ +O. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_16/order_4.txt @@ -0,0 +1 @@ +O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d5ba6aa8bf2c0477f95ef252b831c35fe134778 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_0.txt @@ -0,0 +1 @@ +J. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_1.txt @@ -0,0 +1 @@ +G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_2.txt @@ -0,0 +1 @@ +G. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_3.txt @@ -0,0 +1 @@ +G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_17/order_4.txt @@ -0,0 +1 @@ +G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_0.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e5f5c74df07ffa4d8e7ff469ceb806ff648f1bae --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_1.txt @@ -0,0 +1 @@ +E. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_2.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_3.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_18/order_4.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_0.txt @@ -0,0 +1 @@ +D. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_1.txt @@ -0,0 +1 @@ +D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_2.txt @@ -0,0 +1 @@ +D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6ee9c457800add97cc2ce4e8a9e0e7bb4d52625 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_3.txt @@ -0,0 +1 @@ +B. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_19/order_4.txt @@ -0,0 +1 @@ +D. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_0.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_1.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..398d2fb5b465d779d31a4b9420edf8557bccf2f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_2.txt @@ -0,0 +1 @@ +C. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_3.txt @@ -0,0 +1 @@ +E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_2/order_4.txt @@ -0,0 +1 @@ +E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..22faaa3463fee8b97741bfa08ad37f6d2d6bcdc2 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_0.txt @@ -0,0 +1 @@ +O. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_1.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_2.txt @@ -0,0 +1 @@ +N. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_3.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_20/order_4.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a695f1bd8998a8d41f54413ed8d9af9bffb483d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_0.txt @@ -0,0 +1 @@ +E. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a695f1bd8998a8d41f54413ed8d9af9bffb483d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_1.txt @@ -0,0 +1 @@ +E. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d174a254924ebeabcb8f39041e31dfeb19ae51a6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_2.txt @@ -0,0 +1 @@ +D. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca23c126bfc9159d60ba7dad014d7d5919b8274c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_3.txt @@ -0,0 +1 @@ +B. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ccbbff2467c29135cb108bd90e4fb567ec4f3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_3/order_4.txt @@ -0,0 +1 @@ +C. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_0.txt @@ -0,0 +1 @@ +L. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_1.txt @@ -0,0 +1 @@ +L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_2.txt @@ -0,0 +1 @@ +L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_3.txt @@ -0,0 +1 @@ +L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_4/order_4.txt @@ -0,0 +1 @@ +L. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1abfa38ec1d41da58d87dc2defcb46dba2ece31 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_0.txt @@ -0,0 +1 @@ +L. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1abfa38ec1d41da58d87dc2defcb46dba2ece31 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_1.txt @@ -0,0 +1 @@ +L. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc09885bebc5dbde8e43902e023f8244b169fc8f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_2.txt @@ -0,0 +1 @@ +N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc09885bebc5dbde8e43902e023f8244b169fc8f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_3.txt @@ -0,0 +1 @@ +N. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc09885bebc5dbde8e43902e023f8244b169fc8f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_5/order_4.txt @@ -0,0 +1 @@ +N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb06a6162d999715b50ce2be0fad85f946e5ca64 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_0.txt @@ -0,0 +1 @@ +C. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_1.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_2.txt @@ -0,0 +1 @@ +B. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_3.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_6/order_4.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_0.txt @@ -0,0 +1 @@ +N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_1.txt @@ -0,0 +1 @@ +N. 
green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..475ae7964989fd355660647303c8dff78962dd30 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_2.txt @@ -0,0 +1 @@ +L. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..475ae7964989fd355660647303c8dff78962dd30 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_3.txt @@ -0,0 +1 @@ +L. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_7/order_4.txt @@ -0,0 +1 @@ +N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdba658c9e0d8aa110868a4f4bc461e2b0c73ca5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_0.txt @@ -0,0 +1 @@ +K. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7440574279100430f3674ddc8c64d31888cf355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_1.txt @@ -0,0 +1 @@ +L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7440574279100430f3674ddc8c64d31888cf355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_2.txt @@ -0,0 +1 @@ +L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7440574279100430f3674ddc8c64d31888cf355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_3.txt @@ -0,0 +1 @@ +L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdba658c9e0d8aa110868a4f4bc461e2b0c73ca5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_8/order_4.txt @@ -0,0 +1 @@ +K. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8517557ef31e52857cac921f7e9f6f8f1285e2e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_0.txt @@ -0,0 +1 @@ +F. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..afbc9004d72e2de17c3c1bc46163b58eba0cd43b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_1.txt @@ -0,0 +1 @@ +H. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee3e75a3e2959d95b9db39cbf25e15f18046baec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_2.txt @@ -0,0 +1 @@ +G. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee3e75a3e2959d95b9db39cbf25e15f18046baec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_3.txt @@ -0,0 +1 @@ +G. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee3e75a3e2959d95b9db39cbf25e15f18046baec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_1/sample_9/order_4.txt @@ -0,0 +1 @@ +G. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa5a3dbd005b6451278e75e045c0fd05ccf1608f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_0.txt @@ -0,0 +1 @@ +F. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_1.txt @@ -0,0 +1 @@ +G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_2.txt @@ -0,0 +1 @@ +G. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_3.txt @@ -0,0 +1 @@ +G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_1/order_4.txt @@ -0,0 +1 @@ +G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed6f6d9bdfb1d41fc48e5b1783750e5c5a20d7e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_0.txt @@ -0,0 +1 @@ +K. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_1.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd50425785fdfdc4875e9a4478137f1290aedcf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_2.txt @@ -0,0 +1 @@ +M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd50425785fdfdc4875e9a4478137f1290aedcf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_3.txt @@ -0,0 +1 @@ +M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd50425785fdfdc4875e9a4478137f1290aedcf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_10/order_4.txt @@ -0,0 +1 @@ +M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f7b160edac53a3700f2144795a223fb848c9e6d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_0.txt @@ -0,0 +1 @@ +A. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f7b160edac53a3700f2144795a223fb848c9e6d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_1.txt @@ -0,0 +1 @@ +A. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4e3051b728132ab1a5b0b97dddd07dfc48e88fd6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_2.txt @@ -0,0 +1 @@ +E. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..4e3051b728132ab1a5b0b97dddd07dfc48e88fd6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_3.txt @@ -0,0 +1 @@ +E. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b790f864d1c3d98410f55937aecd07ff47dc4c1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_11/order_4.txt @@ -0,0 +1 @@ +B. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_0.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_1.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_2.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_3.txt @@ -0,0 +1 @@ +L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_12/order_4.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_0.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_1.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_2.txt @@ -0,0 +1 @@ +A. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_3.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_13/order_4.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_0.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_1.txt @@ -0,0 +1 @@ +L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_2.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_3.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_14/order_4.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_0.txt @@ -0,0 +1 @@ +D. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_1.txt @@ -0,0 +1 @@ +A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_2.txt @@ -0,0 +1 @@ +A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_3.txt @@ -0,0 +1 @@ +A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_15/order_4.txt @@ -0,0 +1 @@ +A. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_0.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_1.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_2.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_3.txt @@ -0,0 +1 @@ +B. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_16/order_4.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_0.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_1.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7d6fc5d75cd980666a077197be37487433e7dff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_2.txt @@ -0,0 +1 @@ +J. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_3.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_17/order_4.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..05f1ca84379afba3daf58afe69aebe289fb5be4e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_0.txt @@ -0,0 +1 @@ +M. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fbf683925d6a1976c70d94d413eca790154de671 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_1.txt @@ -0,0 +1 @@ +O. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a95c9fd92409f2869c9663f6c0c603506de4e55 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_2.txt @@ -0,0 +1 @@ +L. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a95c9fd92409f2869c9663f6c0c603506de4e55 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_3.txt @@ -0,0 +1 @@ +L. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a95c9fd92409f2869c9663f6c0c603506de4e55 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_18/order_4.txt @@ -0,0 +1 @@ +L. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b148e5546555d8499c461ba36bf1d86a70a40bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_0.txt @@ -0,0 +1 @@ +I. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_1.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_2.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a2928633a2c7004301f9fd2a2e46809a88675e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_3.txt @@ -0,0 +1 @@ +G. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a2928633a2c7004301f9fd2a2e46809a88675e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_19/order_4.txt @@ -0,0 +1 @@ +G. 
green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_0.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_1.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_2.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_3.txt @@ -0,0 +1 @@ +O. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_2/order_4.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..488aaf0ea72cc1051111b2320743a8a387c42d17 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_0.txt @@ -0,0 +1 @@ +B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..488aaf0ea72cc1051111b2320743a8a387c42d17 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_1.txt @@ -0,0 +1 @@ +B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_2.txt @@ -0,0 +1 @@ +A. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_3.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_20/order_4.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..78e73a8947e4fad4f25d4b47ff2492c457d8ef2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_0.txt @@ -0,0 +1 @@ +B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..78e73a8947e4fad4f25d4b47ff2492c457d8ef2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_1.txt @@ -0,0 +1 @@ +B. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..78e73a8947e4fad4f25d4b47ff2492c457d8ef2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_2.txt @@ -0,0 +1 @@ +B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d2c657898f6b513440be1e7ef80b7f0d2e8616f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_3.txt @@ -0,0 +1 @@ +A. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4335a90ed52448b1c74f7e44bf700126ef75d6dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_3/order_4.txt @@ -0,0 +1 @@ +C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_0.txt @@ -0,0 +1 @@ +G. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_1.txt @@ -0,0 +1 @@ +G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_2.txt @@ -0,0 +1 @@ +G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_3.txt @@ -0,0 +1 @@ +G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_4/order_4.txt @@ -0,0 +1 @@ +G. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4086abca9d1f30bdfe5e2aad93bcd80b00fb60b7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_0.txt @@ -0,0 +1 @@ +F. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_1.txt @@ -0,0 +1 @@ +I. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_2.txt @@ -0,0 +1 @@ +I. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_3.txt @@ -0,0 +1 @@ +I. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_5/order_4.txt @@ -0,0 +1 @@ +I. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_0.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_1.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_2.txt @@ -0,0 +1 @@ +L. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_3.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_6/order_4.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_0.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_1.txt @@ -0,0 +1 @@ +B. 
green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c7c9d399f16cd97bab68e7efb29809ed17b30c8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_2.txt @@ -0,0 +1 @@ +A. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_3.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_7/order_4.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_0.txt @@ -0,0 +1 @@ +A. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_1.txt @@ -0,0 +1 @@ +A. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_2.txt @@ -0,0 +1 @@ +A. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_3.txt @@ -0,0 +1 @@ +A. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_8/order_4.txt @@ -0,0 +1 @@ +A. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_0.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_1.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_2.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_3.txt @@ -0,0 +1 @@ +D. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_2/sample_9/order_4.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5113c76389d7563e77d6ebf6a73b5238743ae3f5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_0.txt @@ -0,0 +1 @@ +M. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_1.txt @@ -0,0 +1 @@ +A. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_2.txt @@ -0,0 +1 @@ +A. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_3.txt @@ -0,0 +1 @@ +A. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_1/order_4.txt @@ -0,0 +1 @@ +A. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_0.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9574b0a41522c19a313f28691f9380d3619ac68d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_1.txt @@ -0,0 +1 @@ +C. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9574b0a41522c19a313f28691f9380d3619ac68d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_2.txt @@ -0,0 +1 @@ +C. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_3.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_10/order_4.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_0.txt @@ -0,0 +1 @@ +F. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_1.txt @@ -0,0 +1 @@ +F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_2.txt @@ -0,0 +1 @@ +F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_3.txt @@ -0,0 +1 @@ +F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_11/order_4.txt @@ -0,0 +1 @@ +F. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_0.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_1.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_2.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_3.txt @@ -0,0 +1 @@ +L. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..f72bef47dbc2768994153539d80421aef99397ba --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_12/order_4.txt @@ -0,0 +1 @@ +O. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..beafdfe4e6806eeee4e2c87ec3c2b9d23429c83d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_0.txt @@ -0,0 +1 @@ +B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_1.txt @@ -0,0 +1 @@ +D. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_2.txt @@ -0,0 +1 @@ +D. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_3.txt @@ -0,0 +1 @@ +D. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_13/order_4.txt @@ -0,0 +1 @@ +D. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f553425c3c153ff8d9a359bf2b304904e8886da9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_0.txt @@ -0,0 +1 @@ +M. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_1.txt @@ -0,0 +1 @@ +L. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_2.txt @@ -0,0 +1 @@ +L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_3.txt @@ -0,0 +1 @@ +L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_14/order_4.txt @@ -0,0 +1 @@ +L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2712dd86946df8149ff6bc89a44c36aabfa00ca7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_0.txt @@ -0,0 +1 @@ +N. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2712dd86946df8149ff6bc89a44c36aabfa00ca7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_1.txt @@ -0,0 +1 @@ +N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2712dd86946df8149ff6bc89a44c36aabfa00ca7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_2.txt @@ -0,0 +1 @@ +N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..83a6f1763c259bdda93d6f2d83c3c8ffe500b77a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_3.txt @@ -0,0 +1 @@ +K. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..83a6f1763c259bdda93d6f2d83c3c8ffe500b77a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_15/order_4.txt @@ -0,0 +1 @@ +K. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_0.txt @@ -0,0 +1 @@ +J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_1.txt @@ -0,0 +1 @@ +J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_2.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_3.txt @@ -0,0 +1 @@ +F. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_16/order_4.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..beafdfe4e6806eeee4e2c87ec3c2b9d23429c83d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_0.txt @@ -0,0 +1 @@ +B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_1.txt @@ -0,0 +1 @@ +D. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_2.txt @@ -0,0 +1 @@ +D. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_3.txt @@ -0,0 +1 @@ +D. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_17/order_4.txt @@ -0,0 +1 @@ +D. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6428f74b867b409891ada024b90f1bd4f6f5c74d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_0.txt @@ -0,0 +1 @@ +G. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a62f6676f90611c800ac1361674dd590b38e1d3a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_1.txt @@ -0,0 +1 @@ +F. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a62f6676f90611c800ac1361674dd590b38e1d3a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_2.txt @@ -0,0 +1 @@ +F. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a62f6676f90611c800ac1361674dd590b38e1d3a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_3.txt @@ -0,0 +1 @@ +F. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6428f74b867b409891ada024b90f1bd4f6f5c74d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_18/order_4.txt @@ -0,0 +1 @@ +G. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_0.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_1.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_2.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_3.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_0.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_1.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_2.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_3.txt @@ -0,0 +1 @@ +D. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_2/order_4.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..273a2ef88e852179c5ca093b91bae0b321096229 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_0.txt @@ -0,0 +1 @@ +I. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_1.txt @@ -0,0 +1 @@ +J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_2.txt @@ -0,0 +1 @@ +J. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7308cff673960e58655c0fa2933972df7f319f46 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_3.txt @@ -0,0 +1 @@ +H. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7308cff673960e58655c0fa2933972df7f319f46 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_20/order_4.txt @@ -0,0 +1 @@ +H. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cea0ef33c2fc9d542c68187afdc1af7f6da3b292 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_0.txt @@ -0,0 +1 @@ +O. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_1.txt @@ -0,0 +1 @@ +M. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_2.txt @@ -0,0 +1 @@ +M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_3.txt @@ -0,0 +1 @@ +M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_3/order_4.txt @@ -0,0 +1 @@ +M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_0.txt @@ -0,0 +1 @@ +F. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_1.txt @@ -0,0 +1 @@ +F. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_2.txt @@ -0,0 +1 @@ +F. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_3.txt @@ -0,0 +1 @@ +F. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_4/order_4.txt @@ -0,0 +1 @@ +F. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_0.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_1.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_2.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_3.txt @@ -0,0 +1 @@ +K. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_5/order_4.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_0.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_1.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_2.txt @@ -0,0 +1 @@ +B. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_3.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_6/order_4.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_0.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_1.txt @@ -0,0 +1 @@ +A. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_2.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_3.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_7/order_4.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d9f34a74d7e0dd21c338db807c15dd2e76bdff3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_0.txt @@ -0,0 +1 @@ +K. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_1.txt @@ -0,0 +1 @@ +N. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_2.txt @@ -0,0 +1 @@ +N. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d9f34a74d7e0dd21c338db807c15dd2e76bdff3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_3.txt @@ -0,0 +1 @@ +K. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_8/order_4.txt @@ -0,0 +1 @@ +N. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_0.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_1.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_2.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_3.txt @@ -0,0 +1 @@ +I. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/CoT/length_3/sample_9/order_4.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_0.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_1.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_2.txt @@ -0,0 +1 @@ +A. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_3.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b69df92f3e4ae537d548eadd49a8be18257e3ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_1/order_4.txt @@ -0,0 +1 @@ +A. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..47ddb6939398a9dfb3517850577fc6c19a139352 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_0.txt @@ -0,0 +1 @@ +B. green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_1.txt @@ -0,0 +1 @@ +A. 
blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_2.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_3.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_10/order_4.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3bf7f8bd23f5e9776716245e0f154177f6fd1a7c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_0.txt @@ -0,0 +1 @@ +H. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5cc819aa574392d7d7507c98764deb0089020a35 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_1.txt @@ -0,0 +1 @@ +F. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_2.txt @@ -0,0 +1 @@ +I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_3.txt @@ -0,0 +1 @@ +I. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6dc01f6af50983461439ef6ed20a6fc3f1fbbe1e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_11/order_4.txt @@ -0,0 +1 @@ +I. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..9814f89dd18447778d14a465ad075b896ec5e7ed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_0.txt @@ -0,0 +1 @@ +O. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9814f89dd18447778d14a465ad075b896ec5e7ed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_1.txt @@ -0,0 +1 @@ +O. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9814f89dd18447778d14a465ad075b896ec5e7ed --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_2.txt @@ -0,0 +1 @@ +O. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_3.txt @@ -0,0 +1 @@ +N. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_12/order_4.txt @@ -0,0 +1 @@ +N. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_0.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_1.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_2.txt @@ -0,0 +1 @@ +A. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_3.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..30f3ff4afb936058eb189b8cecada7811428a9f1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_13/order_4.txt @@ -0,0 +1 @@ +A. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..75fe7cde90ed25447460e5682dd53a849019409a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_0.txt @@ -0,0 +1 @@ +K. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_1.txt @@ -0,0 +1 @@ +N. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_2.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..df4d2f0aa0d05d8b2d2b166031cec14855a43816 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_3.txt @@ -0,0 +1 @@ +N. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..75fe7cde90ed25447460e5682dd53a849019409a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_14/order_4.txt @@ -0,0 +1 @@ +K. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_0.txt @@ -0,0 +1 @@ +L. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_1.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_2.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_3.txt @@ -0,0 +1 @@ +K. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce30660831f35a2a34207cded226e9a328d85947 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_15/order_4.txt @@ -0,0 +1 @@ +K. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b33274f1e655f32271f6e9b6880f93884554a8ee --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_0.txt @@ -0,0 +1 @@ +L. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_1.txt @@ -0,0 +1 @@ +O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_2.txt @@ -0,0 +1 @@ +O. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..f2a53fe2503e9a82622b6fa3f3aaf492e5ae79b8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_3.txt @@ -0,0 +1 @@ +O. 
green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..609cb595b035f9f1e95172a41da44d426dd13d0b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_16/order_4.txt @@ -0,0 +1 @@ +M. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d5ba6aa8bf2c0477f95ef252b831c35fe134778 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_0.txt @@ -0,0 +1 @@ +J. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_1.txt @@ -0,0 +1 @@ +G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_2.txt @@ -0,0 +1 @@ +G. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_3.txt @@ -0,0 +1 @@ +G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6fbc45f9c95a0ade3b0bfd3c7b90df651c1ac429 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_17/order_4.txt @@ -0,0 +1 @@ +G. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_0.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e5f5c74df07ffa4d8e7ff469ceb806ff648f1bae --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_1.txt @@ -0,0 +1 @@ +E. 
green_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_2.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_3.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a21d819e017e6b559c9d1922fb8396976efd2b74 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_18/order_4.txt @@ -0,0 +1 @@ +D. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_0.txt @@ -0,0 +1 @@ +D. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_1.txt @@ -0,0 +1 @@ +D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_2.txt @@ -0,0 +1 @@ +D. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e6ee9c457800add97cc2ce4e8a9e0e7bb4d52625 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_3.txt @@ -0,0 +1 @@ +B. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa48a34ff5cc2df561791531f81dc0c3ff5a40e8 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_19/order_4.txt @@ -0,0 +1 @@ +A. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_0.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_1.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5232a3af3c291d3e68d5cf80b8d40b4bca541cd4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_2.txt @@ -0,0 +1 @@ +A. blue_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_3.txt @@ -0,0 +1 @@ +E. 
blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6cf23d90b1b6e24f4327190e7de06b355588d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_2/order_4.txt @@ -0,0 +1 @@ +E. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..22faaa3463fee8b97741bfa08ad37f6d2d6bcdc2 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_0.txt @@ -0,0 +1 @@ +O. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_1.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_2.txt @@ -0,0 +1 @@ +N. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_3.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..618eef651c5d5adfa784840551836610ee9825d0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_20/order_4.txt @@ -0,0 +1 @@ +N. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a695f1bd8998a8d41f54413ed8d9af9bffb483d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_0.txt @@ -0,0 +1 @@ +E. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a695f1bd8998a8d41f54413ed8d9af9bffb483d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_1.txt @@ -0,0 +1 @@ +E. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca23c126bfc9159d60ba7dad014d7d5919b8274c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_2.txt @@ -0,0 +1 @@ +B. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca23c126bfc9159d60ba7dad014d7d5919b8274c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_3.txt @@ -0,0 +1 @@ +B. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..49ccbbff2467c29135cb108bd90e4fb567ec4f3b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_3/order_4.txt @@ -0,0 +1 @@ +C. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_0.txt @@ -0,0 +1 @@ +L. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_1.txt @@ -0,0 +1 @@ +L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_2.txt @@ -0,0 +1 @@ +L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_3.txt @@ -0,0 +1 @@ +L. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..02867678b8550f616b6632800638fdc3fa45d42f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_4/order_4.txt @@ -0,0 +1 @@ +L. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1abfa38ec1d41da58d87dc2defcb46dba2ece31 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_0.txt @@ -0,0 +1 @@ +L. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1abfa38ec1d41da58d87dc2defcb46dba2ece31 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_1.txt @@ -0,0 +1 @@ +L. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc09885bebc5dbde8e43902e023f8244b169fc8f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_2.txt @@ -0,0 +1 @@ +N. red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc09885bebc5dbde8e43902e023f8244b169fc8f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_3.txt @@ -0,0 +1 @@ +N. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1abfa38ec1d41da58d87dc2defcb46dba2ece31 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_5/order_4.txt @@ -0,0 +1 @@ +L. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb06a6162d999715b50ce2be0fad85f946e5ca64 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_0.txt @@ -0,0 +1 @@ +C. green_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_1.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_2.txt @@ -0,0 +1 @@ +B. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_3.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a06d7d0ca7d74102d3b9ce2351bb405e30a4e4f6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_6/order_4.txt @@ -0,0 +1 @@ +B. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_0.txt @@ -0,0 +1 @@ +N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_1.txt @@ -0,0 +1 @@ +N. 
green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_2.txt @@ -0,0 +1 @@ +N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_3.txt @@ -0,0 +1 @@ +N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..62aaddb4e2403b47e88ee1a9f651ab88fce88bc7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_7/order_4.txt @@ -0,0 +1 @@ +N. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdba658c9e0d8aa110868a4f4bc461e2b0c73ca5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_0.txt @@ -0,0 +1 @@ +K. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7440574279100430f3674ddc8c64d31888cf355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_1.txt @@ -0,0 +1 @@ +L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7440574279100430f3674ddc8c64d31888cf355 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_2.txt @@ -0,0 +1 @@ +L. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdba658c9e0d8aa110868a4f4bc461e2b0c73ca5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_3.txt @@ -0,0 +1 @@ +K. red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdba658c9e0d8aa110868a4f4bc461e2b0c73ca5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_8/order_4.txt @@ -0,0 +1 @@ +K. 
red_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8517557ef31e52857cac921f7e9f6f8f1285e2e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_0.txt @@ -0,0 +1 @@ +F. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee3e75a3e2959d95b9db39cbf25e15f18046baec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_1.txt @@ -0,0 +1 @@ +G. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee3e75a3e2959d95b9db39cbf25e15f18046baec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_2.txt @@ -0,0 +1 @@ +G. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ee3e75a3e2959d95b9db39cbf25e15f18046baec --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_3.txt @@ -0,0 +1 @@ +G. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8517557ef31e52857cac921f7e9f6f8f1285e2e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_1/sample_9/order_4.txt @@ -0,0 +1 @@ +F. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa5a3dbd005b6451278e75e045c0fd05ccf1608f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_0.txt @@ -0,0 +1 @@ +F. green_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_1.txt @@ -0,0 +1 @@ +G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_2.txt @@ -0,0 +1 @@ +G. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_3.txt @@ -0,0 +1 @@ +G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8297445e8078b7b5d79a61bd6a320cb1831e57bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_1/order_4.txt @@ -0,0 +1 @@ +G. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed6f6d9bdfb1d41fc48e5b1783750e5c5a20d7e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_0.txt @@ -0,0 +1 @@ +K. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..64006cf08eb706664a17d92233835d355970b048 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_1.txt @@ -0,0 +1 @@ +L. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd50425785fdfdc4875e9a4478137f1290aedcf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_2.txt @@ -0,0 +1 @@ +M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd50425785fdfdc4875e9a4478137f1290aedcf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_3.txt @@ -0,0 +1 @@ +M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8cd50425785fdfdc4875e9a4478137f1290aedcf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_10/order_4.txt @@ -0,0 +1 @@ +M. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f7b160edac53a3700f2144795a223fb848c9e6d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_0.txt @@ -0,0 +1 @@ +A. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f7b160edac53a3700f2144795a223fb848c9e6d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_1.txt @@ -0,0 +1 @@ +A. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4e3051b728132ab1a5b0b97dddd07dfc48e88fd6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_2.txt @@ -0,0 +1 @@ +E. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f7b160edac53a3700f2144795a223fb848c9e6d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_3.txt @@ -0,0 +1 @@ +A. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b790f864d1c3d98410f55937aecd07ff47dc4c1 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_11/order_4.txt @@ -0,0 +1 @@ +B. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_0.txt @@ -0,0 +1 @@ +L. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_1.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_2.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d44620b08fb34b5a19f2f46ce51467304f010018 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_3.txt @@ -0,0 +1 @@ +L. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..939b93d185a7aab7fbead0bd24d18a54824341e4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_12/order_4.txt @@ -0,0 +1 @@ +O. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_0.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_1.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_2.txt @@ -0,0 +1 @@ +A. 
red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_3.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..df794401fc59db930b5a360374ce899b74a05c44 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_13/order_4.txt @@ -0,0 +1 @@ +A. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_0.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_1.txt @@ -0,0 +1 @@ +L. 
blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_2.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_3.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..5c19b723e4927ca12fdd55a5f537ef0554730637 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_14/order_4.txt @@ -0,0 +1 @@ +L. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4fb14412f118011cf467f1356d7867174d0e3f0 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_0.txt @@ -0,0 +1 @@ +D. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_1.txt @@ -0,0 +1 @@ +A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_2.txt @@ -0,0 +1 @@ +A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_3.txt @@ -0,0 +1 @@ +A. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..49b699df98f863744ce461d2b1639bb4168ce27b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_15/order_4.txt @@ -0,0 +1 @@ +A. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_0.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_1.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..61f7ffb8f54e8b5bdc2133a560152dca8de2f273 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_2.txt @@ -0,0 +1 @@ +C. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_3.txt @@ -0,0 +1 @@ +B. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ba52ebad94a8694e71d1c61a1f5a610f6d159ad4 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_16/order_4.txt @@ -0,0 +1 @@ +B. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_0.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_1.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7d6fc5d75cd980666a077197be37487433e7dff --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_2.txt @@ -0,0 +1 @@ +J. 
green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c8924966fb5d035b25e00e268f222224e66cb2be --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_3.txt @@ -0,0 +1 @@ +G. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..87f7e79c16f9fac8b9ca168a8d33744137a201d6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_17/order_4.txt @@ -0,0 +1 @@ +K. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..05f1ca84379afba3daf58afe69aebe289fb5be4e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_0.txt @@ -0,0 +1 @@ +M. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..fbf683925d6a1976c70d94d413eca790154de671 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_1.txt @@ -0,0 +1 @@ +O. 
red_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a95c9fd92409f2869c9663f6c0c603506de4e55 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_2.txt @@ -0,0 +1 @@ +L. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a95c9fd92409f2869c9663f6c0c603506de4e55 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_3.txt @@ -0,0 +1 @@ +L. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a95c9fd92409f2869c9663f6c0c603506de4e55 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_18/order_4.txt @@ -0,0 +1 @@ +L. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b148e5546555d8499c461ba36bf1d86a70a40bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_0.txt @@ -0,0 +1 @@ +I. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b148e5546555d8499c461ba36bf1d86a70a40bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_1.txt @@ -0,0 +1 @@ +I. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..693b5c71027d3e30e3ab963c96d7409907cd7811 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_2.txt @@ -0,0 +1 @@ +J. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b148e5546555d8499c461ba36bf1d86a70a40bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_3.txt @@ -0,0 +1 @@ +I. blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2b148e5546555d8499c461ba36bf1d86a70a40bb --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_19/order_4.txt @@ -0,0 +1 @@ +I. 
blue_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_0.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_1.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_2.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_3.txt @@ -0,0 +1 @@ +O. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d59fe2a8c4b4c5cf56a5b2bfe680115234a2c8d9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_2/order_4.txt @@ -0,0 +1 @@ +O. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..488aaf0ea72cc1051111b2320743a8a387c42d17 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_0.txt @@ -0,0 +1 @@ +B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..488aaf0ea72cc1051111b2320743a8a387c42d17 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_1.txt @@ -0,0 +1 @@ +B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_2.txt @@ -0,0 +1 @@ +A. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..488aaf0ea72cc1051111b2320743a8a387c42d17 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_3.txt @@ -0,0 +1 @@ +B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..488aaf0ea72cc1051111b2320743a8a387c42d17 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_20/order_4.txt @@ -0,0 +1 @@ +B. blue_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..78e73a8947e4fad4f25d4b47ff2492c457d8ef2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_0.txt @@ -0,0 +1 @@ +B. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..78e73a8947e4fad4f25d4b47ff2492c457d8ef2a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_1.txt @@ -0,0 +1 @@ +B. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d2c657898f6b513440be1e7ef80b7f0d2e8616f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_2.txt @@ -0,0 +1 @@ +A. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d2c657898f6b513440be1e7ef80b7f0d2e8616f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_3.txt @@ -0,0 +1 @@ +A. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..4335a90ed52448b1c74f7e44bf700126ef75d6dd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_3/order_4.txt @@ -0,0 +1 @@ +C. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_0.txt @@ -0,0 +1 @@ +G. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_1.txt @@ -0,0 +1 @@ +G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_2.txt @@ -0,0 +1 @@ +G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_3.txt @@ -0,0 +1 @@ +G. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7b83503e475d1b3d7e1c2943073eda45600de4cd --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_4/order_4.txt @@ -0,0 +1 @@ +G. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4086abca9d1f30bdfe5e2aad93bcd80b00fb60b7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_0.txt @@ -0,0 +1 @@ +F. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_1.txt @@ -0,0 +1 @@ +I. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_2.txt @@ -0,0 +1 @@ +I. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_3.txt @@ -0,0 +1 @@ +I. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b4d1859d8f8904d5c67f162460d762b97b345446 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_5/order_4.txt @@ -0,0 +1 @@ +I. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_0.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_1.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_2.txt @@ -0,0 +1 @@ +L. 
red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_3.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..2825568621d7890e69cb953615fa9fe3bb85cc08 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_6/order_4.txt @@ -0,0 +1 @@ +L. red_basket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_0.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_1.txt @@ -0,0 +1 @@ +B. 
green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_2.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_3.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..cc4496397c4fd9939c7b8c5daa933392a440380a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_7/order_4.txt @@ -0,0 +1 @@ +B. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_0.txt @@ -0,0 +1 @@ +A. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_1.txt @@ -0,0 +1 @@ +A. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_2.txt @@ -0,0 +1 @@ +A. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_3.txt @@ -0,0 +1 @@ +A. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d5700c4e42b3290f90ce8432ca9e1723cbcf39b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_8/order_4.txt @@ -0,0 +1 @@ +A. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_0.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_1.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_2.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_3.txt @@ -0,0 +1 @@ +D. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..d987bc2d531e93dfaedbc698b4d56e24efaa78b3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_2/sample_9/order_4.txt @@ -0,0 +1 @@ +D. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..5113c76389d7563e77d6ebf6a73b5238743ae3f5 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_0.txt @@ -0,0 +1 @@ +M. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_1.txt @@ -0,0 +1 @@ +A. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_2.txt @@ -0,0 +1 @@ +A. 
blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_3.txt @@ -0,0 +1 @@ +A. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..c39318e0d7b091934dc635601522baf995cfb42c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_1/order_4.txt @@ -0,0 +1 @@ +A. blue_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_0.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9574b0a41522c19a313f28691f9380d3619ac68d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_1.txt @@ -0,0 +1 @@ +C. 
green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9574b0a41522c19a313f28691f9380d3619ac68d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_2.txt @@ -0,0 +1 @@ +C. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_3.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..fed83117e891372f464f3c40ccde41cfb16e5c8a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_10/order_4.txt @@ -0,0 +1 @@ +A. green_bathtub \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_0.txt @@ -0,0 +1 @@ +F. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_1.txt @@ -0,0 +1 @@ +F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_2.txt @@ -0,0 +1 @@ +F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_3.txt @@ -0,0 +1 @@ +F. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..878a7d421efdd6bdbc2a315961eb3e55b2a8e367 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_11/order_4.txt @@ -0,0 +1 @@ +F. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_0.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_1.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_2.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_3.txt @@ -0,0 +1 @@ +L. 
green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..058f980e2760c76b2abeadc524c2b6604677bc0f --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_12/order_4.txt @@ -0,0 +1 @@ +L. green_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..beafdfe4e6806eeee4e2c87ec3c2b9d23429c83d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_0.txt @@ -0,0 +1 @@ +B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_1.txt @@ -0,0 +1 @@ +D. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_2.txt @@ -0,0 +1 @@ +D. 
blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_3.txt @@ -0,0 +1 @@ +D. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..59ccd1db21b7ec169432ce8dd79c602dbd3be44d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_13/order_4.txt @@ -0,0 +1 @@ +D. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..f553425c3c153ff8d9a359bf2b304904e8886da9 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_0.txt @@ -0,0 +1 @@ +M. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_1.txt @@ -0,0 +1 @@ +L. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_2.txt @@ -0,0 +1 @@ +L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_3.txt @@ -0,0 +1 @@ +L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca060d653221b07ac01cfe59ee63187514632c59 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_14/order_4.txt @@ -0,0 +1 @@ +L. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..2712dd86946df8149ff6bc89a44c36aabfa00ca7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_0.txt @@ -0,0 +1 @@ +N. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..2712dd86946df8149ff6bc89a44c36aabfa00ca7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_1.txt @@ -0,0 +1 @@ +N. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..83a6f1763c259bdda93d6f2d83c3c8ffe500b77a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_2.txt @@ -0,0 +1 @@ +K. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..83a6f1763c259bdda93d6f2d83c3c8ffe500b77a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_3.txt @@ -0,0 +1 @@ +K. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..83a6f1763c259bdda93d6f2d83c3c8ffe500b77a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_15/order_4.txt @@ -0,0 +1 @@ +K. 
red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_0.txt @@ -0,0 +1 @@ +J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_1.txt @@ -0,0 +1 @@ +J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_2.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_3.txt @@ -0,0 +1 @@ +F. 
green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..67e1be4be039844f264ce66827a12f1bc0793074 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_16/order_4.txt @@ -0,0 +1 @@ +F. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..beafdfe4e6806eeee4e2c87ec3c2b9d23429c83d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_0.txt @@ -0,0 +1 @@ +B. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_1.txt @@ -0,0 +1 @@ +D. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_2.txt @@ -0,0 +1 @@ +D. 
red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_3.txt @@ -0,0 +1 @@ +D. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..e03a4a3d9c4d1cf377409ed3b7dc70e6ae3a3a15 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_17/order_4.txt @@ -0,0 +1 @@ +D. red_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..6428f74b867b409891ada024b90f1bd4f6f5c74d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_0.txt @@ -0,0 +1 @@ +G. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a62f6676f90611c800ac1361674dd590b38e1d3a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_1.txt @@ -0,0 +1 @@ +F. 
green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a62f6676f90611c800ac1361674dd590b38e1d3a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_2.txt @@ -0,0 +1 @@ +F. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a62f6676f90611c800ac1361674dd590b38e1d3a --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_3.txt @@ -0,0 +1 @@ +F. green_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..6428f74b867b409891ada024b90f1bd4f6f5c74d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_18/order_4.txt @@ -0,0 +1 @@ +G. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_0.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_1.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_2.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_3.txt @@ -0,0 +1 @@ +L. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b76c614f5e4757b26a63f1960e48b5ab831e9230 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_19/order_4.txt @@ -0,0 +1 @@ +L. 
blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..092e465946c9c0e7565338ef5a8f8a1c7daad59e --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_0.txt @@ -0,0 +1 @@ +E. green_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_1.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_2.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_3.txt @@ -0,0 +1 @@ +D. 
blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b224627a040883f2a072f3579eba47d329376210 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_2/order_4.txt @@ -0,0 +1 @@ +D. blue_suitcase \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..273a2ef88e852179c5ca093b91bae0b321096229 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_0.txt @@ -0,0 +1 @@ +I. red_envelope \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_1.txt @@ -0,0 +1 @@ +J. blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4eff4b66d1d499003fdc679860edf7f9a4571031 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_2.txt @@ -0,0 +1 @@ +J. 
blue_cupboard \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..7308cff673960e58655c0fa2933972df7f319f46 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_3.txt @@ -0,0 +1 @@ +H. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..7308cff673960e58655c0fa2933972df7f319f46 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_20/order_4.txt @@ -0,0 +1 @@ +H. blue_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..cea0ef33c2fc9d542c68187afdc1af7f6da3b292 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_0.txt @@ -0,0 +1 @@ +O. green_crate \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_1.txt @@ -0,0 +1 @@ +M. 
red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..9b29537478cfec01d43434ac400bba0b56384016 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_2.txt @@ -0,0 +1 @@ +CONTENE_FILRER. \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_3.txt @@ -0,0 +1 @@ +M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..69f15ecdbc95f827e35e0f461a8c8a87111ac68b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_3/order_4.txt @@ -0,0 +1 @@ +M. red_drawer \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_0.txt @@ -0,0 +1 @@ +F. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_1.txt @@ -0,0 +1 @@ +F. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_2.txt @@ -0,0 +1 @@ +F. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_3.txt @@ -0,0 +1 @@ +F. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..943b4511334ce98fdf92fe69eeb4bb2e190dc65b --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_4/order_4.txt @@ -0,0 +1 @@ +F. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_0.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_1.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_2.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_3.txt @@ -0,0 +1 @@ +K. 
red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..a2ca98e544c8ec79e90d3a008e537e076df72ba7 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_5/order_4.txt @@ -0,0 +1 @@ +K. red_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_0.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..a88b89d90b7808511acfff8cb8907a798bfce2bf --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_1.txt @@ -0,0 +1 @@ +B. red_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..b252b740d943384f07c33e27e865865cb6430c3d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_2.txt @@ -0,0 +1 @@ +D. 
blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..88c6cde00a2062fc41230f0c8c5b0d074e2ae428 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_3.txt @@ -0,0 +1 @@ +C. blue_bucket \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..b252b740d943384f07c33e27e865865cb6430c3d --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_6/order_4.txt @@ -0,0 +1 @@ +D. blue_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_0.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_1.txt @@ -0,0 +1 @@ +A. 
green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_2.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_3.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..015351113d53d8f675d4a27b1e6430027a32ba93 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_7/order_4.txt @@ -0,0 +1 @@ +A. green_bottle \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d9f34a74d7e0dd21c338db807c15dd2e76bdff3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_0.txt @@ -0,0 +1 @@ +K. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f181ff15a4a57e50a7053612f04d0023a2fd82c --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_1.txt @@ -0,0 +1 @@ +N. green_box \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a320ce22cc978c76c724052435c14f529ab03c6 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_2.txt @@ -0,0 +1 @@ +L. green_treasure_chest \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d9f34a74d7e0dd21c338db807c15dd2e76bdff3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_3.txt @@ -0,0 +1 @@ +K. red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_4.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_4.txt new file mode 100644 index 0000000000000000000000000000000000000000..3d9f34a74d7e0dd21c338db807c15dd2e76bdff3 --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_8/order_4.txt @@ -0,0 +1 @@ +K. 
red_pantry \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_0.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_0.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_0.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_1.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_1.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_1.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_2.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_2.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_2.txt @@ -0,0 +1 @@ +I. blue_container \ No newline at end of file diff --git a/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_3.txt b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_3.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfa61fa12baaf33c98e718a430e48b0ce40790ef --- /dev/null +++ b/ToMh_dataset/extracted_response_original/Tell/MC/length_3/sample_9/order_3.txt @@ -0,0 +1 @@ +I. 
def main(input_folder='data_ToMh', output_folder='prompt_ToMh',
         lengths=(1, 2, 3), orders=(0, 1, 2, 3, 4),
         prompts=('CoT', 'MC'), tells=('No_Tell', 'Tell'),
         sample_nums=range(1, 21)):
    """Write an answer-free copy of every story file into the prompt folder.

    For each combination of tell / prompt / length / order / sample, reads
    ``<input_folder>/<tell>/<prompt>/length_<length>/sample_<n>/order_<order>.txt``
    and writes the same lines, minus every line whose first
    whitespace-separated token is ``Answer:``, to the mirrored path under
    ``output_folder``. Output directories are created as needed.

    All parameters default to the values that were previously hard-coded,
    so calling ``main()`` with no arguments processes the same file grid
    as before.

    Args:
        input_folder: Root directory holding the stories with answers.
        output_folder: Root directory receiving the stripped prompts.
        lengths: Story lengths to process (``length_<k>`` folders).
        orders: Question orders to process (``order_<k>.txt`` files).
        prompts: Prompt-style folder names.
        tells: Communication-setting folder names.
        sample_nums: Sample indices to process (``sample_<k>`` folders).

    Raises:
        OSError: If an expected input file cannot be opened (for example
            ``FileNotFoundError`` when it is missing) or an output path
            cannot be written.
    """
    for tell, prompt, length, order, sample_num in itertools.product(
            tells, prompts, lengths, orders, sample_nums):
        # Same relative layout on both sides; only the root folder differs.
        rel_dir = os.path.join(
            tell, prompt, f'length_{length}', f'sample_{sample_num}')
        file_name = f'order_{order}.txt'
        input_fn = os.path.join(input_folder, rel_dir, file_name)
        output_dir = os.path.join(output_folder, rel_dir)
        output_fn = os.path.join(output_dir, file_name)

        with open(input_fn, 'r') as file:
            lines = file.readlines()

        # Compare the (possibly empty) list of first tokens instead of
        # indexing [0]: a blank or whitespace-only line yields [] and is
        # kept, where indexing would raise IndexError.
        new_lines = [line for line in lines
                     if line.split(maxsplit=1)[:1] != ['Answer:']]

        # exist_ok avoids the separate exists() check and its race.
        os.makedirs(output_dir, exist_ok=True)
        with open(output_fn, 'w') as file:
            file.writelines(new_lines)
def generate_story_with_specified_chapters(
    world_paths, output_dir_path, n, noise=0.1, train_noise=False, order=-1,
    num_chapter=-1, exist_tell_in_story=False, prompt='CoT', exist_answer=False
):
    """Generate story files for every world, story length, sample, mode and order.

    For each world definition, ``n[0]`` stories are generated per requested
    story length. Every story is written once per prompt mode (``MC`` and
    ``CoT``) and once per question order to
    ``<output_dir_path>/<mode>/length_<k>/sample_<i>/order_<o>.txt``.
    Each file holds an instruction line, ``Story:``, the stringified story
    and a fixed note listing the assumptions the reader should make.

    Args:
        world_paths: Iterable of paths to world definition files. Every
            world writes to the same output paths, so with several worlds
            later ones overwrite the files of earlier ones.
        output_dir_path: Root directory for the generated files.
        n: Sequence whose first element is the number of samples per length.
        noise: Forwarded to the task generator as ``statement_noise``.
        train_noise: Accepted for interface compatibility; not used here.
        order: Single question order to emit, or -1 for orders 0 through 4.
        num_chapter: Single story length to emit, or -1 for lengths 1 to 3.
            The task table below covers lengths 1 through 4.
        exist_tell_in_story: Forwarded to the task generator.
        prompt: Accepted for interface compatibility; not used here (both
            modes are always written).
        exist_answer: Forwarded unchanged to ``stringify``.
    """
    mkdir_p(output_dir_path)
    n = n[0]

    # Instruction line per prompt mode (loop-invariant text).
    instructions = {
        'MC': 'The following story happens in chronological order. You will be given a multiple-choice question and a note at the end. Directly output the answer without explanation.\n',
        'CoT': 'The following story happens in chronological order. You will be given a multiple-choice question and a note at the end. First give step-by-step analysis about the question. Then output the answer.\n',
    }

    # NOTE(review): this block previously contained an unresolved merge
    # conflict (<<<<<<< HEAD ... >>>>>>> 50242d0), which made the module a
    # SyntaxError. It is resolved to the incoming (50242d0) wording, which
    # is the grammatically corrected note and additionally states that the
    # exit order is known to all agents. Confirm this is the intended side.
    note = (
        "\nNote: You should assume the following. "
        "(1) An agent witnesses everything and every movement before exiting a location. "
        "(2) An agent A can infer another agent B's mental state only if A and B have been in the same location, or have private or public interactions. "
        "(3) Note that every agent tends to lie. "
        "What an agent A tells others doesn't affect A's actual belief. "
        "An agent tends to trust an agent that exited the room later than himself. "
        "The exit order is known to all agents. "
        "(4) Agents in private communications know that others won't hear them, but they know that anyone can hear any public claims.\n"
    )

    # Task types indexed by (story length - 1); each entry is passed as a
    # plain list of tuples to the task generator.
    tasks_per_length = [
        [('A5', True)],  # 1 chapter
        [('A5', False), ('A3', True)],  # 2 chapters
        [('A5', True), ('A3', False), ('A4', True)],  # 3 chapters
        [('A5', False), ('A3', True),
         ('A4', False), ('A2', True)],  # 4 chapters
    ]

    # If order and num_chapter are not specified, cover the default ranges.
    orders = [0, 1, 2, 3, 4] if order == -1 else [order]
    num_chapters = [1, 2, 3] if num_chapter == -1 else [num_chapter]
    modes = ['MC', 'CoT']

    for world in world_paths:

        w = World()
        w.load(world)

        # Task creator for this world.
        task = Specify_Tasks()

        for length_of_story in num_chapters:
            folder_name_2 = f'length_{length_of_story}'
            logging.info("Creating New task in %s...", folder_name_2)

            for i in range(1, n + 1):
                folder_name_3 = f'sample_{i}'
                # One story per sample; it is reused for every mode and
                # order. The question order is applied later by stringify,
                # so order=0 here is only a placeholder.
                story = task.generate_story_qs_at_end(
                    w, length_of_story, tasks_per_length[length_of_story - 1],
                    num_agents=5, num_locations=3, statement_noise=noise,
                    order=0, exist_tell_in_story=exist_tell_in_story
                )

                for mode in modes:
                    sample_dir = os.path.join(
                        output_dir_path, mode, folder_name_2, folder_name_3)
                    # Created once per mode instead of once per file.
                    os.makedirs(sample_dir, exist_ok=True)

                    for order_of_story in orders:
                        path = os.path.join(
                            sample_dir, f'order_{order_of_story}.txt')

                        with open(path, 'w', encoding='utf-8') as f:
                            f.write(instructions[mode])
                            f.write('Story:\n')
                            f.write('\n'.join(stringify(
                                story, exist_answer=exist_answer,
                                order=order_of_story)))
                            f.write(note)
not the story has communications between agents' + ) + parser.add_argument( + '-p', '--prompt', dest='prompt_type', type=str, default='CoT', + choices=['MC', 'CoT'], + help='The type of prompt chosen between MC and CoT' + ) + parser.add_argument( + '-a', '--answer', dest='exist_answer', type=bool, default=False, + help='Whether or not the data has answers' + ) + + parsed = parser.parse_args(args) + + return parsed + + +def main(args=sys.argv[1:]): + """Main function to generate all the story-question pairs.""" + args = parse_args(args) + logging.basicConfig( + level=args.logging, format='%(asctime)s\t%(levelname)-8s\t%(message)s' + ) + folder_name = 'Tell/' if args.exist_tell else 'No_Tell/' + + # folder_name += args.prompt_type + # output_dir_path = os.path.join(args.output_dir_path, folder_name) if args.exist_answer else os.path.join('prompt_ToMh', folder_name) + + output_dir_path = os.path.join(args.output_dir_path, folder_name) + + generate_story_with_specified_chapters( + world_paths=args.world_paths, + output_dir_path=output_dir_path, + n=args.num_stories_choices, + noise=args.test_noise, + train_noise=args.train_noise, + order=args.order, + num_chapter=args.num_chapter, + exist_tell_in_story=args.exist_tell, + prompt=args.prompt_type, + exist_answer=args.exist_answer, + ) + + +if __name__ == "__main__": + sys.exit(main()) diff --git a/ToMh_dataset/generate_tomh.sh b/ToMh_dataset/generate_tomh.sh new file mode 100644 index 0000000000000000000000000000000000000000..b71c85e05be2cdddd1fdd64235483f0ec08e66db --- /dev/null +++ b/ToMh_dataset/generate_tomh.sh @@ -0,0 +1,7 @@ +#!/bin/sh + +# Generate data +python3.10 create_world.py +python3.10 generate_tasks.py -w world_large.txt -n 20 -ptn=0.1 +python3.10 generate_tasks.py -w world_large.txt -n 20 -ptn=0.1 --tell True +python3.10 generate_prompts.py \ No newline at end of file diff --git a/ToMh_dataset/media/Picture1.png b/ToMh_dataset/media/Picture1.png new file mode 100644 index 
0000000000000000000000000000000000000000..fc5e7080928a6e5c69eb1aac80ab216d5b0efdb1 --- /dev/null +++ b/ToMh_dataset/media/Picture1.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:438a35c66e09b2a1e5d973e7099134293b1c28c888aee34094dc67d939642dae +size 1033816 diff --git a/ToMh_dataset/oracle.py b/ToMh_dataset/oracle.py new file mode 100644 index 0000000000000000000000000000000000000000..36a134872579156e9c24a3ec2ecdf59f79d75cec --- /dev/null +++ b/ToMh_dataset/oracle.py @@ -0,0 +1,147 @@ +""" +The Oracle class keeps track of all object +and agent locations as well as a map of +beliefs about object and agent locations. +""" +import copy + +class LocationMap(object): + + def __init__(self, agents, locations, objects, containers): + + # Maps agents to their locations. + self.locations = {agent : None for agent in agents} + + # Maps agents to their locations. + self.container_locations = {container : None for container in containers} + + # Maps locations to their containers + self.containers = {location : None for location in locations} + + # Maps containers to the objects they hold + self.container_objs = {container : [] for container in containers} + + # Maps objects to their containers + self.obj_containers = {obj : None for obj in objects} + +class MemoryMap(object): + + def __init__(self, agents, objects): + + zero_dict = {obj : None for obj in objects} + first_dict = {agent : copy.deepcopy(zero_dict) for agent in agents} + second_dict = {agent : copy.deepcopy(first_dict) for agent in agents} + third_dict = {agent : copy.deepcopy(second_dict) for agent in agents} + fourth_dict = {agent : copy.deepcopy(third_dict) for agent in agents} + + # Dictionary of dictionaries mapping + # agents to objects to containers. Represents + # agents' belief about location of containers. + self.first_belief = copy.deepcopy(first_dict) + + # Dictionary of dictionaries of dictionaries + # mapping agents to direct belief dictionaries. 
+ # Represents agents' belief about other agents' + # beliefs about location of containers. + self.second_belief = copy.deepcopy(second_dict) + self.third_belief = copy.deepcopy(third_dict) + self.fourth_belief = copy.deepcopy(fourth_dict) + +class Oracle(object): + + def __init__(self, agents, locations, objects, containers): + self.memory_map = MemoryMap(agents, objects) + self.locations = LocationMap(agents, locations, objects, containers) + + ######################################### + ################ Beliefs ################ + ######################################### + + def get_first_belief(self, agent, obj): + beliefs = self.memory_map.first_belief + return beliefs[agent][obj] + + def set_first_belief(self, agent, obj, container): + beliefs = self.memory_map.first_belief + beliefs[agent][obj] = container + + def get_second_belief(self, a1, a2, obj): + second_belief = self.memory_map.second_belief + return second_belief[a1][a2][obj] + + def set_second_belief(self, a1, a2, obj, container): + second_belief = self.memory_map.second_belief + second_belief[a1][a2][obj] = container + + def get_third_belief(self, a1, a2, a3, obj): + third_belief = self.memory_map.third_belief + return third_belief[a1][a2][a3][obj] + + def set_third_belief(self, a1, a2, a3, obj, container): + third_belief = self.memory_map.third_belief + third_belief[a1][a2][a3][obj] = container + + def get_fourth_belief(self, a1, a2, a3, a4, obj): + fourth_belief = self.memory_map.fourth_belief + return fourth_belief[a1][a2][a3][a4][obj] + + def set_fourth_belief(self, a1, a2, a3, a4, obj, container): + fourth_belief = self.memory_map.fourth_belief + fourth_belief[a1][a2][a3][a4][obj] = container + + ######################################### + ############### Locations ############### + ######################################### + + def get_location(self, agent): + return self.locations.locations[agent] + + def set_location(self, agent, location): + self.locations.locations[agent] = location + + 
def get_containers(self, location): + # Returns a list of containers at location + return self.locations.containers[location] + + def set_containers(self, location, containers): + # May need to change to move containers bt locs + # Containers is a list of containers at location + for container in containers: + self._set_container_location(container, location) + self.locations.containers[location] = containers + + def get_objects_at_location(self, location): + objects = [] + for container in self.get_containers(location): + objects.extend(self.get_container_obj(container)) + return objects + + def get_container_location(self, container): + return self.locations.container_locations[container] + + def _set_container_location(self, container, location): + self.locations.container_locations[container] = location + + def get_container_obj(self, container): + # get list of objects in container + return self.locations.container_objs[container] + + def _add_container_obj(self, container, obj): + self.locations.container_objs[container].append(obj) + + def _remove_container_obj(self, container, obj): + self.locations.container_objs[container].remove(obj) + + def get_object_container(self, obj): + # get container that holds object + return self.locations.obj_containers[obj] + + def set_object_container(self, obj, container): + # set container that holds object + prev_container = self.get_object_container(obj) + if prev_container: + self._remove_container_obj(prev_container, obj) + self._add_container_obj(container, obj) + self.locations.obj_containers[obj] = container + + \ No newline at end of file diff --git a/ToMh_dataset/stringify.py b/ToMh_dataset/stringify.py new file mode 100644 index 0000000000000000000000000000000000000000..4e7c98edff6f8e48cd57a8d9564713def8c5e0c3 --- /dev/null +++ b/ToMh_dataset/stringify.py @@ -0,0 +1,47 @@ +import numpy as np + + +def stringify(story, exist_answer=False, order=0): # exist_answer is dummy + + lines = [] + + i = 0 # The number of 
descriptions processed + j = 0 # The number of lines output + count_order = 0 + + while True: + + + if isinstance(story[i], str): + line = story[i] + else: + line = story[i].render() + # Capitalize the line + line = line[0].upper() + line[1:] + + # Prepend the line number + if line.split()[0] != 'Question:' and line.split()[0] != 'Choices:': + line = '%d %s' % (i + 1, line) + else: # Start with 'Choice' + if line.split()[0] == 'Choices:': + lines.append(line) + break + else: # Start with 'Question' + if count_order == order: + lines.append(line) + count_order += 1 + i += 1 + continue + lines.append(line) + # Increment counters + i += 1 + + # Append supporting lines indices if necessary + # if hasattr(story[i], 'idx_support') and story[i].idx_support: + # line += '\t%s' % ' '.join([str(x + 1) + # for x in story[i].idx_support]) + + if i >= len(story): + break + + return lines diff --git a/ToMh_dataset/tasks.py b/ToMh_dataset/tasks.py new file mode 100644 index 0000000000000000000000000000000000000000..9bfda058dc0b6446b6e1315ba189bf755eea97e1 --- /dev/null +++ b/ToMh_dataset/tasks.py @@ -0,0 +1,518 @@ +import numpy as np +import random +import copy + +from clause import Clause, Question +from oracle import Oracle +from dynamic_actions import * +from collections import defaultdict + + +def sample_question(oracle_start_state, oracle, random_actors, obj, question_idx=0): + idx_dummy = [0] + a1, a2, a3, a4, _ = random_actors + questions = [Question(idx_dummy, ZeroQ(oracle, obj)), + Question(idx_dummy, FirstQ(oracle, a4, obj)), + Question(idx_dummy, SecondQ(oracle, a3, a4, obj)), + Question(idx_dummy, ThirdQ(oracle, a2, a3, a4, obj)), + Question(idx_dummy, FourthQ(oracle, a1, a2, a3, a4, obj))] + return questions[question_idx] + +####################################### +############## Chapters ############### +####################################### + + +def write_A2_chapter( + start_state, oracle, obj, location, agent_ids, all_agents, movements=None, exist_tell=False, 
questions=None +): + a1, a2 = all_agents[agent_ids[0]], all_agents[agent_ids[1]] + outsiders = [agent for agent in all_agents if agent not in [a1, a2]] + agent_ids = [aid+1 for aid in agent_ids] + + # Pick containers. The first element is the initial container of obj + containers = [oracle.get_object_container(obj)] + container_candidates = oracle.get_containers(location)[:] + container_candidates.remove(containers[0]) + containers += random.sample(container_candidates, 2) + + # Fill in the chapter + chapter = [] + + # All selected agents enter the room and see the object + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, location))), + Clause(ObjectLocAction(oracle, obj, [a1, a2])), + ]) + + # a1 + chapter.extend([ + Clause(MoveAction(oracle, (a1, obj, containers[1]), [ + a2], move=movements[0])), + Clause(ExitedAction(oracle, (a1))) + ]) + # a2 + chapter.extend([ + Clause(MoveAction( + oracle, (a2, obj, containers[2]), None, move=movements[1])), + Clause(ExitedAction(oracle, (a2))) + ]) + + # Everyone enter the waiting room + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, 'waiting_room'))) + ]) + + # tell actions has 3 different forms + if exist_tell: + tell_containers = random.sample(oracle.get_containers(location)[:], 2) + tell_form = random.choice( + range(3)) if outsiders else random.choice(range(2)) + match tell_form: + case 0: + chapter.extend([ + Clause(PublicTellAction( + oracle, a1, obj, tell_containers[0], listeners=all_agents, believers=outsiders)), + Clause(PrivateTellAction(oracle, a2, a1, + obj, tell_containers[1], trust=True)), + ]) + case 1: + chapter.extend([ + Clause(PublicTellAction( + oracle, a2, obj, tell_containers[0], listeners=all_agents, believers=[a1] + outsiders)), + Clause(PrivateTellAction(oracle, a1, a2, obj, + tell_containers[1], trust=False)), + ]) + case 2: + chapter.extend([ + Clause(PrivateTellAction(oracle, a1, random.choice(outsiders), + obj, tell_containers[0], trust=True)) + ]) + return chapter + + +def 
write_A3_chapter( + start_state, oracle, obj, location, agent_ids, all_agents, movements=None, exist_tell=False, questions=None +): + a1, a2, a3 = all_agents[agent_ids[0] + ], all_agents[agent_ids[1]], all_agents[agent_ids[2]] + outsiders = [agent for agent in all_agents if agent not in [a1, a2, a3]] + agent_ids = [aid+1 for aid in agent_ids] + + # Pick containers. The first element is the initial container of obj + containers = [oracle.get_object_container(obj)] + container_candidates = oracle.get_containers(location)[:] + container_candidates.remove(containers[0]) + containers += random.sample(container_candidates, 3) + + # Fill in the chapter + chapter = [] + + # All selected agents enter the room and see the object + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, a3, location))), + Clause(ObjectLocAction(oracle, obj, [a1, a2, a3])), + ]) + + # a1 + chapter.extend([ + Clause(MoveAction(oracle, (a1, obj, containers[1]), [ + a2, a3], move=movements[0])), + Clause(ExitedAction(oracle, (a1))) + ]) + # a2 + chapter.extend([ + Clause(MoveAction(oracle, (a2, obj, containers[2]), [ + a3], move=movements[1])), + Clause(ExitedAction(oracle, (a2))) + ]) + # a3 + chapter.extend([ + Clause(MoveAction( + oracle, (a3, obj, containers[3]), None, move=movements[2])), + Clause(ExitedAction(oracle, (a3))) + ]) + + # Everyone enter the waiting room + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, a3, 'waiting_room'))) + ]) + + # tell actions has 4 different forms + if exist_tell: + tell_containers = random.sample(oracle.get_containers(location)[:], 2) + tell_form = random.choice( + range(4)) if outsiders else random.choice(range(2)) + match tell_form: + case 0: + # a2 lies to all, and a3 lies to a2 + chapter.extend([ + Clause(PublicTellAction( + oracle, a2, obj, tell_containers[0], listeners=all_agents, believers=[a1] + outsiders)), + Clause(PrivateTellAction(oracle, a3, a2, + obj, tell_containers[1], trust=True)), + ]) + case 1: + # a3 lies to all, and a1 lies to 
a3 + chapter.extend([ + Clause(PublicTellAction( + oracle, a3, obj, tell_containers[0], listeners=all_agents, believers=[a1, a2] + outsiders)), + Clause(PrivateTellAction(oracle, a1, a3, obj, + tell_containers[1], trust=False)), + ]) + case 2: + # a1 lies to all, but a3 tells the true location to an outside agent + chapter.extend([ + Clause(PublicTellAction( + oracle, a1, obj, tell_containers[0], listeners=all_agents, believers=outsiders)), + Clause(PrivateTellAction(oracle, a3, random.choice(outsiders), + obj, oracle.get_object_container(obj), trust=True)) + ]) + case 3: + # a2 lies to a3, but a3 tells the true location to an outside agent + chapter.extend([ + Clause(PrivateTellAction(oracle, a2, a3, + obj, tell_containers[0], trust=False)), + Clause(PrivateTellAction(oracle, a3, random.choice(outsiders), + obj, oracle.get_object_container(obj), trust=True)) + ]) + return chapter + + +def write_A4_chapter( + start_state, oracle, obj, location, agent_ids, all_agents, movements=None, exist_tell=False, questions=None +): + a1, a2, a3, a4 = all_agents[agent_ids[0] + ], all_agents[agent_ids[1]], all_agents[agent_ids[2]], all_agents[agent_ids[3]] + outsiders = [ + agent for agent in all_agents if agent not in [a1, a2, a3, a4]] + agent_ids = [aid+1 for aid in agent_ids] + + # Pick containers. 
The first element is the initial container of obj + containers = [oracle.get_object_container(obj)] + container_candidates = oracle.get_containers(location)[:] + container_candidates.remove(containers[0]) + containers += random.sample(container_candidates, 4) + + # Fill in the chapter + chapter = [] + + # All selected agents enter the room and see the object + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, a3, a4, location))), + Clause(ObjectLocAction(oracle, obj, [a1, a2, a3, a4])), + ]) + + # a1 + chapter.extend([ + Clause(MoveAction(oracle, (a1, obj, containers[1]), [ + a2, a3, a4], move=movements[0])), + Clause(ExitedAction(oracle, (a1))) + ]) + # a2 + chapter.extend([ + Clause(MoveAction(oracle, (a2, obj, containers[2]), [ + a3, a4], move=movements[1])), + Clause(ExitedAction(oracle, (a2))) + ]) + # a3 + chapter.extend([ + Clause(MoveAction(oracle, (a3, obj, containers[3]), [ + a4], move=movements[2])), + Clause(ExitedAction(oracle, (a3))) + ]) + # a4 + chapter.extend([ + Clause(MoveAction( + oracle, (a4, obj, containers[4]), None, move=movements[3])), + Clause(ExitedAction(oracle, (a4))) + ]) + + # Everyone enter the waiting room + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, a3, a4, 'waiting_room'))) + ]) + + # tell actions has 4 different forms + if exist_tell: + tell_containers = random.sample(oracle.get_containers(location)[:], 2) + tell_form = random.choice( + range(4)) if outsiders else random.choice(range(2)) + match tell_form: + case 0: + # a2 lies to all, and a3 lies to a2 + chapter.extend([ + Clause(PublicTellAction( + oracle, a2, obj, tell_containers[0], listeners=all_agents, believers=[a1] + outsiders)), + Clause(PrivateTellAction(oracle, a4, a3, + obj, tell_containers[1], trust=True)), + ]) + case 1: + # a3 lies to all, and a1 lies to a4 + chapter.extend([ + Clause(PublicTellAction( + oracle, a3, obj, tell_containers[0], listeners=all_agents, believers=[a1, a2] + outsiders)), + Clause(PrivateTellAction(oracle, a1, a4, obj, + 
tell_containers[1], trust=False)), + ]) + case 2: + outsider = random.choice(outsiders) + # a1 lies to all, but a4 tells the true location to an outside agent + chapter.extend([ + Clause(PublicTellAction( + oracle, a1, obj, tell_containers[0], listeners=all_agents, believers=outsiders)), + Clause(PrivateTellAction(oracle, a4, outsider, + obj, oracle.get_object_container(obj), trust=True)) + ]) + case 3: + outsider = random.choice(outsiders) + # a2 lies to a3, but a4 tells the true location to an outside agent + chapter.extend([ + Clause(PrivateTellAction(oracle, a2, a3, + obj, tell_containers[0], trust=False)), + Clause(PrivateTellAction(oracle, a4, outsider, + obj, oracle.get_object_container(obj), trust=True)) + ]) + return chapter + + +def write_A5_chapter( + start_state, oracle, obj, location, agent_ids, all_agents, movements=None, exist_tell=False, questions=None +): + a1, a2, a3, a4, a5 = all_agents[agent_ids[0]], all_agents[agent_ids[1] + ], all_agents[agent_ids[2]], all_agents[agent_ids[3]], all_agents[agent_ids[4]] + agent_ids = [aid+1 for aid in agent_ids] + + # Pick containers. 
The first element is the initial container of obj + containers = [oracle.get_object_container(obj)] + container_candidates = oracle.get_containers(location)[:] + container_candidates.remove(containers[0]) + containers += random.sample(container_candidates, 4) + + # Fill in the chapter + chapter = [] + + # All selected agents enter the room and see the object + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, a3, a4, a5, location))), + Clause(ObjectLocAction(oracle, obj, [a1, a2, a3, a4, a5])), + ]) + + # a1 + chapter.extend([ + Clause(MoveAction(oracle, (a1, obj, containers[1]), [ + a2, a3, a4, a5], move=movements[0])), + Clause(ExitedAction(oracle, (a1))) + ]) + # a2 + chapter.extend([ + Clause(MoveAction(oracle, (a2, obj, containers[2]), [ + a3, a4, a5], move=movements[1])), + Clause(ExitedAction(oracle, (a2))) + ]) + # a3 + chapter.extend([ + Clause(MoveAction(oracle, (a3, obj, containers[3]), [ + a4, a5], move=movements[2])), + Clause(ExitedAction(oracle, (a3))) + ]) + # a4 + chapter.extend([ + Clause(MoveAction(oracle, (a4, obj, containers[4]), [ + a5], move=movements[3])), + Clause(ExitedAction(oracle, (a4))) + ]) + # a5 + chapter.extend([ + Clause(MoveAction( + oracle, (a5, obj, containers[0]), None, move=movements[4])), + Clause(ExitedAction(oracle, (a5))) + ]) + + # Everyone enter the waiting room + chapter.extend([ + Clause(EnterAction(oracle, (a1, a2, a3, a4, a5, 'waiting_room'))) + ]) + + # tell actions has 3 different forms + if exist_tell: + tell_containers = random.sample(oracle.get_containers(location)[:], 2) + tell_form = random.choice(range(3)) + match tell_form: + case 0: + # a3 lies to all, and a5 lies to a3 + chapter.extend([ + Clause(PublicTellAction( + oracle, a3, obj, tell_containers[0], listeners=all_agents, believers=[a1, a2])), + Clause(PrivateTellAction(oracle, a5, a3, + obj, tell_containers[1], trust=True)), + ]) + case 1: + # a4 lies to all, but a5 tells the true location to a1 + chapter.extend([ + Clause(PublicTellAction( + 
oracle, a4, obj, tell_containers[0], listeners=all_agents, believers=[a1, a2, a3])), + Clause(PrivateTellAction(oracle, a5, a1, obj, + oracle.get_object_container(obj), trust=True)), + ]) + case 2: + # a3 lies a1, and a2 lies to a4 + chapter.extend([ + Clause(PrivateTellAction(oracle, a3, a1, + obj, tell_containers[0], trust=True)) + ]) + return chapter + + +####################################### +############### Tasks ################# +####################################### + +class Task(object): + + def __init__(self, + num_questions=5, + exit_prob=1., + informant_prob=1., + search_prob=1., + test_cond='first order'): + + self.num_questions = num_questions + + self.search_prob = search_prob + + self.exit_inform_probs = [1 - exit_prob, + exit_prob * (1 - informant_prob), + exit_prob * informant_prob] + assert sum(self.exit_inform_probs) == 1 + + assert test_cond in ['first order', + 'second order', + 'reality', + 'memory'], \ + "Invalid test condition: %s" % test_cond + self.test_cond = test_cond + + def generate_story(self, world): + raise NotImplementedError("Abstract method.") + + +class Specify_Tasks(Task): + def generate_story_qs_at_end( + self, world, tasks_per_story, tasks, num_agents=5, + num_locations=3, statement_noise=0.1, order=0, exist_tell_in_story=False + ): + """ + Allows user to specify chapter and question for each task in story. + + :tasks: list with length of tasks per story. Each entry is a string in + the set {'tb','fb','sofb'} + + :questions: list with length of tasks per story. Each entry is a string + in the set {'memory', 'reality', 'belief', 'search'} + + :statement_noise: probability of encountering noise sentence like 'The + dog ran through the kitchen.' 
+ """ + + # Fetch agents and objects and select a random subset + idx_support_dummy = [0] + actors = world.get_actors() + locations = world.get_locations() + objects = world.get_objects() + containers = world.get_containers() + + random_actors = np.random.choice( + actors, size=num_agents, replace=False + ) + random_locations = np.random.choice( + locations, size=num_locations, replace=False + ) + random_objects = np.random.choice( + objects, size=num_locations*2, replace=False + ) + random_containers = np.random.choice( + containers, size=num_locations*5, replace=False + ) + + # Create the oracle + oracle = Oracle( + random_actors, random_locations, random_objects, random_containers + ) + + # Populate locations in the oracle with containers + for i, random_location in enumerate(random_locations): + location = random_location + containers = random_containers[5*i:5*i+5] + oracle.set_containers(location, list(containers)) + # Two of the containers have objects + oracle.set_object_container( + random_objects[2*i], containers[0]) + oracle.set_object_container( + random_objects[2*i+1], containers[1]) + + # Need start state for memory question + start_state = oracle.locations.obj_containers.copy() + + # Create story by task + chapters = {'A2': write_A2_chapter, + 'A3': write_A3_chapter, + 'A4': write_A4_chapter, + 'A5': write_A5_chapter} + story = [] + obj_pool = [] + obj_in_question = None + + for i in range(tasks_per_story): + chapter = chapters[tasks[i][0]] + location = np.random.choice(random_locations) + obj = np.random.choice(oracle.get_objects_at_location(location)) + # Use the obj in the first chap as the target + if i == 0: + obj_in_question = obj + obj_pool.append(obj) + agent_ids = list(range(5)) + random.shuffle(agent_ids) + + # Randomly choose movements for each agent + agent_num = int(tasks[i][0][1]) + bools = [True, False] + movements = [random.choice(bools) for _ in range(agent_num)] + exist_tell_in_chapter = tasks[i][1] if exist_tell_in_story else False 
+ story.extend( + chapter( + start_state, oracle, obj, location, agent_ids, random_actors, movements=movements, exist_tell=exist_tell_in_chapter + ) + ) + + # At the end, add noise sentences randomly + if statement_noise: + noisy_story = [] + prev_i = 0 + noise = [i for i + in range(len(story)) if np.random.rand() < statement_noise + ] + for i in noise: + noisy_story.extend( + story[prev_i:i] + + [Clause(NoiseAction(random_actors, + random_containers, random_objects))] + ) + prev_i = i + noisy_story.extend(story[prev_i:]) + + # compute questions of all orders + questioned_actors = copy.deepcopy(random_actors) + random.shuffle(questioned_actors) + for idx in range(5): + noisy_story.append( + sample_question( + start_state, oracle, questioned_actors, obj_in_question, question_idx=idx + ) + ) + + # Generate choices of containers + choices = ', '.join(f'{chr(65+i)}. {container}' for i, + container in enumerate(random_containers)) + noisy_story.append('Choices: ' + choices + '\n') + return noisy_story diff --git a/ToMh_dataset/test_azure.py b/ToMh_dataset/test_azure.py new file mode 100644 index 0000000000000000000000000000000000000000..7575868d6814a73c9bc8a5996c635c5a31e816c9 --- /dev/null +++ b/ToMh_dataset/test_azure.py @@ -0,0 +1,43 @@ +import os +import openai + +def record_progress(filename): + with open('progress.txt', 'a') as f: + f.write(filename + '\n') + +def is_processed(filename): + with open('progress.txt', 'r') as f: + processed_files = f.read().splitlines() + return filename in processed_files + +openai.api_type = "azure" +openai.api_base = "https://openaiserviceforclausaeu.openai.azure.com/" +openai.api_version = "2023-03-15-preview" +openai.api_key = os.getenv("OPENAI_API_KEY") + +test_dirs = os.listdir("prompt_ToMh") +for test_dir in test_dirs: + test_fns = os.listdir(f"prompt_ToMh/{test_dir}") + for test_fn in test_fns: + full_path = f"prompt_ToMh/{test_dir}/{test_fn}" + if is_processed(full_path): + continue + print(test_fn) + print(f"path: 
# ---- ToMh_dataset/utils.py ----
from argparse import ArgumentTypeError
import errno
import os


class Error(Exception):
    """Base class for exceptions in this module."""


class InputError(Error):
    """Exception raised for errors in the input.

    Attributes:
        expr: input expression in which the error occurred
        msg: explanation of the error
    """

    def __init__(self, expr, msg):
        self.expr = expr
        self.msg = msg


def is_file(f):
    """Check that ``f`` can be opened for reading and return it unchanged.

    Raises ``ArgumentTypeError`` when the open fails (presumably so it can
    serve as an argparse ``type=`` callable -- confirm against callers).
    """
    try:
        # Only probing readability: close the handle right away instead of
        # leaking it until garbage collection.
        with open(f, 'r'):
            pass
    except IOError:
        raise ArgumentTypeError("{0} does not exist".format(f))
    return f


def mkdir_p(path):
    """Create ``path`` and any missing parents, like ``mkdir -p``.

    An already existing directory is not an error; any other ``OSError``
    (including ``path`` existing as a non-directory) propagates.

    Returns:
        ``path``, unchanged.
    """
    try:
        os.makedirs(path)
    except OSError as exc:  # Python >2.5
        # Swallow only "already exists as a directory".
        if not (exc.errno == errno.EEXIST and os.path.isdir(path)):
            raise
    return path


def remove_extension(path):
    """Return the base name of ``path`` with its last extension removed."""
    return os.path.splitext(os.path.basename(path))[0]


# ---- ToMh_dataset/world.py ----
class World(object):
    """Registry of entities and their boolean predicates.

    ``entities`` maps an entity name to a dict of ``{predicate: True}``;
    ``actions`` is stored as given and not otherwise used by this class.
    """

    def __init__(self, world_actions=None, entities=None):
        """Create a world.

        Args:
            world_actions: optional list of actions; a fresh list is used
                when omitted.
            entities: optional ``{name: {predicate: True}}`` dict; a fresh
                dict is used when omitted.

        Explicitly passed containers are stored by reference, as before.
        The defaults are created per instance: with ``[]`` / ``{}`` written
        in the signature every ``World()`` shared one dict, so ``load`` on
        one instance leaked entities into all the others.
        """
        self.actions = [] if world_actions is None else world_actions
        self.entities = {} if entities is None else entities

    def load(self, fname):
        """Populate ``self.entities`` from a world definition file.

        Recognised lines (blank lines and ``#`` comments are skipped):
            ``create <name>``             -- (re)register ``<name>`` with no
                                             predicates
            ``set <name> <predicate>``    -- mark ``<predicate>`` True

        Raises:
            KeyError: a ``set`` line names an entity that was not created.
            IndexError: a ``create``/``set`` line has no entity name.
        """
        # The context manager closes the file even if a line is malformed.
        with open(fname, 'r') as handle:
            for raw in handle:
                line = raw.rstrip('\n')
                if line == '' or line.startswith('#'):
                    continue
                fields = line.split(' ')
                if line.startswith('create'):
                    self.entities[fields[1]] = {}
                elif line.startswith('set'):
                    self.entities[fields[1]][fields[-1]] = True

    def get_entity(self, predicates):
        """Return names of entities for which every predicate is ``True``.

        Args:
            predicates: list of predicate names; an empty list matches
                every entity.

        Raises:
            InputError: ``predicates`` is not a list.
        """
        if not isinstance(predicates, list):
            # NOTE: a standalone world.py needs
            # ``from utils import InputError`` for this name to resolve.
            raise InputError(predicates, 'is not a list.')

        return [
            name for name, attrs in self.entities.items()
            if all(attrs.get(predicate) is True for predicate in predicates)
        ]

    def get_actors(self):
        """Return entities flagged both ``is_actor`` and ``is_god``."""
        return self.get_entity(['is_actor', 'is_god'])

    def get_containers(self):
        """Return entities flagged both ``is_thing`` and ``is_container``."""
        return self.get_entity(['is_thing', 'is_container'])

    def get_locations(self):
        """Return entities flagged ``is_location``."""
        return self.get_entity(['is_location'])

    def get_objects(self):
        """Return entities flagged both ``is_thing`` and ``is_gettable``."""
        return self.get_entity(['is_thing', 'is_gettable'])
is_location + +create dining_room +set dining_room is_thing +set dining_room is_location + +create garden +set garden is_thing +set garden is_location + +create office +set office is_thing +set office is_location + +create master_bedroom +set master_bedroom is_thing +set master_bedroom is_location + +create playroom +set playroom is_thing +set playroom is_location + +create patio +set patio is_thing +set patio is_location + +create porch +set porch is_thing +set porch is_location + +create cellar +set cellar is_thing +set cellar is_location + +create workshop +set workshop is_thing +set workshop is_location + +create hallway +set hallway is_thing +set hallway is_location + +create back_yard +set back_yard is_thing +set back_yard is_location + +create attic +set attic is_thing +set attic is_location + +create basement +set basement is_thing +set basement is_location + +create lounge +set lounge is_thing +set lounge is_location + +create living_room +set living_room is_thing +set living_room is_location + +create garage +set garage is_thing +set garage is_location + +create staircase +set staircase is_thing +set staircase is_location + +# objects + +create green_pepper +set green_pepper is_thing +set green_pepper is_gettable + +create cabbage +set cabbage is_thing +set cabbage is_gettable + +create corn +set corn is_thing +set corn is_gettable + +create eggplant +set eggplant is_thing +set eggplant is_gettable + +create cucumber +set cucumber is_thing +set cucumber is_gettable + +create pineapple +set pineapple is_thing +set pineapple is_gettable + +create pear +set pear is_thing +set pear is_gettable + +create asparagus +set asparagus is_thing +set asparagus is_gettable + +create strawberry +set strawberry is_thing +set strawberry is_gettable + +create celery +set celery is_thing +set celery is_gettable + +create watermelon +set watermelon is_thing +set watermelon is_gettable + +create potato +set potato is_thing +set potato is_gettable + +create radish +set radish 
is_thing +set radish is_gettable + +create carrot +set carrot is_thing +set carrot is_gettable + +create plum +set plum is_thing +set plum is_gettable + +create peach +set peach is_thing +set peach is_gettable + +create broccoli +set broccoli is_thing +set broccoli is_gettable + +create grapefruit +set grapefruit is_thing +set grapefruit is_gettable + +create banana +set banana is_thing +set banana is_gettable + +create apple +set apple is_thing +set apple is_gettable + +create turnip +set turnip is_thing +set turnip is_gettable + +create grapes +set grapes is_thing +set grapes is_gettable + +create cherry +set cherry is_thing +set cherry is_gettable + +create persimmon +set persimmon is_thing +set persimmon is_gettable + +create spinach +set spinach is_thing +set spinach is_gettable + +create tomato +set tomato is_thing +set tomato is_gettable + +create sweet_potato +set sweet_potato is_thing +set sweet_potato is_gettable + +create pumpkin +set pumpkin is_thing +set pumpkin is_gettable + +create tangerine +set tangerine is_thing +set tangerine is_gettable + +create onion +set onion is_thing +set onion is_gettable + +# containers + +create red_bathtub +set red_bathtub is_thing +set red_bathtub is_container + +create blue_crate +set blue_crate is_thing +set blue_crate is_container + +create green_bottle +set green_bottle is_thing +set green_bottle is_container + +create red_basket +set red_basket is_thing +set red_basket is_container + +create green_bathtub +set green_bathtub is_thing +set green_bathtub is_container + +create green_container +set green_container is_thing +set green_container is_container + +create blue_suitcase +set blue_suitcase is_thing +set blue_suitcase is_container + +create blue_cupboard +set blue_cupboard is_thing +set blue_cupboard is_container + +create blue_bucket +set blue_bucket is_thing +set blue_bucket is_container + +create red_envelope +set red_envelope is_thing +set red_envelope is_container + +create red_treasure_chest +set 
red_treasure_chest is_thing +set red_treasure_chest is_container + +create red_pantry +set red_pantry is_thing +set red_pantry is_container + +create red_bottle +set red_bottle is_thing +set red_bottle is_container + +create blue_drawer +set blue_drawer is_thing +set blue_drawer is_container + +create green_crate +set green_crate is_thing +set green_crate is_container + +create green_treasure_chest +set green_treasure_chest is_thing +set green_treasure_chest is_container + +create green_basket +set green_basket is_thing +set green_basket is_container + +create red_box +set red_box is_thing +set red_box is_container + +create green_pantry +set green_pantry is_thing +set green_pantry is_container + +create green_suitcase +set green_suitcase is_thing +set green_suitcase is_container + +create blue_envelope +set blue_envelope is_thing +set blue_envelope is_container + +create blue_pantry +set blue_pantry is_thing +set blue_pantry is_container + +create green_bucket +set green_bucket is_thing +set green_bucket is_container + +create red_suitcase +set red_suitcase is_thing +set red_suitcase is_container + +create red_crate +set red_crate is_thing +set red_crate is_container + +create green_envelope +set green_envelope is_thing +set green_envelope is_container + +create blue_container +set blue_container is_thing +set blue_container is_container + +create blue_treasure_chest +set blue_treasure_chest is_thing +set blue_treasure_chest is_container + +create blue_box +set blue_box is_thing +set blue_box is_container + +create blue_bathtub +set blue_bathtub is_thing +set blue_bathtub is_container + +# actors + +create Benjamin +set Benjamin is_actor +set Benjamin is_god + +create Mila +set Mila is_actor +set Mila is_god + +create Mason +set Mason is_actor +set Mason is_god + +create Jayden +set Jayden is_actor +set Jayden is_god + +create Aiden +set Aiden is_actor +set Aiden is_god + +create Isla +set Isla is_actor +set Isla is_god + +create Jack +set Jack is_actor +set Jack 
is_god + +create Aria +set Aria is_actor +set Aria is_god + +create Ethan +set Ethan is_actor +set Ethan is_god + +create Isabella +set Isabella is_actor +set Isabella is_god + +create Nathan +set Nathan is_actor +set Nathan is_god + +create William +set William is_actor +set William is_god + +create Jackson +set Jackson is_actor +set Jackson is_god + +create Alexander +set Alexander is_actor +set Alexander is_god + +create Liam +set Liam is_actor +set Liam is_god + +create Elizabeth +set Elizabeth is_actor +set Elizabeth is_god + +create Evelyn +set Evelyn is_actor +set Evelyn is_god + +create Amelia +set Amelia is_actor +set Amelia is_god + +create Ava +set Ava is_actor +set Ava is_god + +create Emily +set Emily is_actor +set Emily is_god + +create Hannah +set Hannah is_actor +set Hannah is_god + +create Ella +set Ella is_actor +set Ella is_god + +create Emma +set Emma is_actor +set Emma is_god + +create Carter +set Carter is_actor +set Carter is_god + +create Gracie +set Gracie is_actor +set Gracie is_god + +create Charlotte +set Charlotte is_actor +set Charlotte is_god + +create Lucas +set Lucas is_actor +set Lucas is_god + +create Sophia +set Sophia is_actor +set Sophia is_god + +create Lily +set Lily is_actor +set Lily is_god + +create Abigail +set Abigail is_actor +set Abigail is_god diff --git a/ToMh_dataset/world_small.txt b/ToMh_dataset/world_small.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb45a360c8e0659b5ce5fe8fe28bb71c29ed20e0 --- /dev/null +++ b/ToMh_dataset/world_small.txt @@ -0,0 +1,167 @@ +# locations + +create laundry +set laundry is_thing +set laundry is_location + +create master_bedroom +set master_bedroom is_thing +set master_bedroom is_location + +create crawlspace +set crawlspace is_thing +set crawlspace is_location + +create back_yard +set back_yard is_thing +set back_yard is_location + +create hall +set hall is_thing +set hall is_location + +create basement +set basement is_thing +set basement is_location + 
+create living_room +set living_room is_thing +set living_room is_location + +create patio +set patio is_thing +set patio is_location + +create sunroom +set sunroom is_thing +set sunroom is_location + +create garden +set garden is_thing +set garden is_location + +# objects + +create pear +set pear is_thing +set pear is_gettable + +create lime +set lime is_thing +set lime is_gettable + +create broccoli +set broccoli is_thing +set broccoli is_gettable + +create cucumber +set cucumber is_thing +set cucumber is_gettable + +create tomato +set tomato is_thing +set tomato is_gettable + +create orange +set orange is_thing +set orange is_gettable + +create lemon +set lemon is_thing +set lemon is_gettable + +create peach +set peach is_thing +set peach is_gettable + +create celery +set celery is_thing +set celery is_gettable + +create plum +set plum is_thing +set plum is_gettable + +# containers + +create blue_bathtub +set blue_bathtub is_thing +set blue_bathtub is_container + +create red_bottle +set red_bottle is_thing +set red_bottle is_container + +create blue_suitcase +set blue_suitcase is_thing +set blue_suitcase is_container + +create blue_bottle +set blue_bottle is_thing +set blue_bottle is_container + +create blue_pantry +set blue_pantry is_thing +set blue_pantry is_container + +create green_basket +set green_basket is_thing +set green_basket is_container + +create green_cupboard +set green_cupboard is_thing +set green_cupboard is_container + +create blue_container +set blue_container is_thing +set blue_container is_container + +create green_drawer +set green_drawer is_thing +set green_drawer is_container + +create red_suitcase +set red_suitcase is_thing +set red_suitcase is_container + +# actors + +create Nathan +set Nathan is_actor +set Nathan is_god + +create Alexander +set Alexander is_actor +set Alexander is_god + +create Abigail +set Abigail is_actor +set Abigail is_god + +create Jack +set Jack is_actor +set Jack is_god + +create Amelia +set Amelia is_actor +set 
Amelia is_god + +create Olivia +set Olivia is_actor +set Olivia is_god + +create Gracie +set Gracie is_actor +set Gracie is_god + +create Jacob +set Jacob is_actor +set Jacob is_god + +create Jayden +set Jayden is_actor +set Jayden is_god + +create Noah +set Noah is_actor +set Noah is_god diff --git a/ToMh_dataset/world_tiny.txt b/ToMh_dataset/world_tiny.txt new file mode 100644 index 0000000000000000000000000000000000000000..d60aab3c93e8574ca16106f0182d1fd658f59a4e --- /dev/null +++ b/ToMh_dataset/world_tiny.txt @@ -0,0 +1,87 @@ +# locations + +create office +set office is_thing +set office is_location + +create workshop +set workshop is_thing +set workshop is_location + +create bathroom +set bathroom is_thing +set bathroom is_location + +create back_yard +set back_yard is_thing +set back_yard is_location + +create basement +set basement is_thing +set basement is_location + +# objects + +create radish +set radish is_thing +set radish is_gettable + +create potato +set potato is_thing +set potato is_gettable + +create green_pepper +set green_pepper is_thing +set green_pepper is_gettable + +create apple +set apple is_thing +set apple is_gettable + +create melon +set melon is_thing +set melon is_gettable + +# containers + +create blue_container +set blue_container is_thing +set blue_container is_container + +create red_cupboard +set red_cupboard is_thing +set red_cupboard is_container + +create blue_suitcase +set blue_suitcase is_thing +set blue_suitcase is_container + +create red_crate +set red_crate is_thing +set red_crate is_container + +create red_suitcase +set red_suitcase is_thing +set red_suitcase is_container + +# actors + +create Owen +set Owen is_actor +set Owen is_god + +create Elizabeth +set Elizabeth is_actor +set Elizabeth is_god + +create James +set James is_actor +set James is_god + +create Jayden +set Jayden is_actor +set Jayden is_god + +create Hannah +set Hannah is_actor +set Hannah is_god